From ee772aaf0f7a05fafb3fa286419148211362b0d6 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Tue, 27 Feb 2024 23:17:11 +0100 Subject: [PATCH 001/289] Use clang-18 in CI --- .github/workflows/nightly.yml | 4 +- docker/packager/README.md | 8 ++-- docker/packager/packager | 24 +++++------ docker/test/fuzzer/run-fuzzer.sh | 2 +- docker/test/keeper-jepsen/run.sh | 2 +- docker/test/server-jepsen/run.sh | 2 +- docker/test/sqltest/run.sh | 2 +- docker/test/util/Dockerfile | 2 +- docs/en/development/build-cross-osx.md | 6 +-- docs/en/development/build-cross-riscv.md | 2 +- docs/en/development/build.md | 6 +-- docs/en/development/continuous-integration.md | 4 +- docs/en/development/developer-instruction.md | 2 +- tests/ci/ci_config.py | 42 +++++++++---------- 14 files changed, 54 insertions(+), 54 deletions(-) diff --git a/.github/workflows/nightly.yml b/.github/workflows/nightly.yml index 93ac2be19b4..4f7915acd28 100644 --- a/.github/workflows/nightly.yml +++ b/.github/workflows/nightly.yml @@ -51,8 +51,8 @@ jobs: SONAR_SCANNER_VERSION: 4.8.0.2856 SONAR_SERVER_URL: "https://sonarcloud.io" BUILD_WRAPPER_OUT_DIR: build_wrapper_output_directory # Directory where build-wrapper output will be placed - CC: clang-17 - CXX: clang++-17 + CC: clang-18 + CXX: clang++-18 steps: - name: Check out repository code uses: ClickHouse/checkout@v1 diff --git a/docker/packager/README.md b/docker/packager/README.md index e0b7f38ea58..efc79f2e131 100644 --- a/docker/packager/README.md +++ b/docker/packager/README.md @@ -3,10 +3,10 @@ compilers and build settings. Correctly configured Docker daemon is single depen Usage: -Build deb package with `clang-17` in `debug` mode: +Build deb package with `clang-18` in `debug` mode: ``` $ mkdir deb/test_output -$ ./packager --output-dir deb/test_output/ --package-type deb --compiler=clang-17 --debug-build +$ ./packager --output-dir deb/test_output/ --package-type deb --compiler=clang-18 --debug-build $ ls -l deb/test_output -rw-r--r-- 1 root root 3730 clickhouse-client_22.2.2+debug_all.deb -rw-r--r-- 1 root root 84221888 clickhouse-common-static_22.2.2+debug_amd64.deb @@ -17,11 +17,11 @@ $ ls -l deb/test_output ``` -Build ClickHouse binary with `clang-17` and `address` sanitizer in `relwithdebuginfo` +Build ClickHouse binary with `clang-18` and `address` sanitizer in `relwithdebuginfo` mode: ``` $ mkdir $HOME/some_clickhouse -$ ./packager --output-dir=$HOME/some_clickhouse --package-type binary --compiler=clang-17 --sanitizer=address +$ ./packager --output-dir=$HOME/some_clickhouse --package-type binary --compiler=clang-18 --sanitizer=address $ ls -l $HOME/some_clickhouse -rwxr-xr-x 1 root root 787061952 clickhouse lrwxrwxrwx 1 root root 10 clickhouse-benchmark -> clickhouse diff --git a/docker/packager/packager b/docker/packager/packager index ca0ae8358f3..43391af8660 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -403,19 +403,19 @@ def parse_args() -> argparse.Namespace: parser.add_argument( "--compiler", choices=( - "clang-17", - "clang-17-darwin", - "clang-17-darwin-aarch64", - "clang-17-aarch64", - "clang-17-aarch64-v80compat", - "clang-17-ppc64le", - "clang-17-riscv64", - "clang-17-s390x", - "clang-17-amd64-compat", - "clang-17-amd64-musl", - "clang-17-freebsd", + "clang-18", + "clang-18-darwin", + "clang-18-darwin-aarch64", + "clang-18-aarch64", + "clang-18-aarch64-v80compat", + "clang-18-ppc64le", + "clang-18-riscv64", + "clang-18-s390x", + "clang-18-amd64-compat", + "clang-18-amd64-musl", + "clang-18-freebsd", ), - default="clang-17", + 
default="clang-18", help="a compiler to use", ) parser.add_argument( diff --git a/docker/test/fuzzer/run-fuzzer.sh b/docker/test/fuzzer/run-fuzzer.sh index b4376fe2409..9e950668b00 100755 --- a/docker/test/fuzzer/run-fuzzer.sh +++ b/docker/test/fuzzer/run-fuzzer.sh @@ -17,7 +17,7 @@ stage=${stage:-} script_dir="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )" echo "$script_dir" repo_dir=ch -BINARY_TO_DOWNLOAD=${BINARY_TO_DOWNLOAD:="clang-17_debug_none_unsplitted_disable_False_binary"} +BINARY_TO_DOWNLOAD=${BINARY_TO_DOWNLOAD:="clang-18_debug_none_unsplitted_disable_False_binary"} BINARY_URL_TO_DOWNLOAD=${BINARY_URL_TO_DOWNLOAD:="https://clickhouse-builds.s3.amazonaws.com/$PR_TO_TEST/$SHA_TO_TEST/clickhouse_build_check/$BINARY_TO_DOWNLOAD/clickhouse"} function git_clone_with_retry diff --git a/docker/test/keeper-jepsen/run.sh b/docker/test/keeper-jepsen/run.sh index 576a0f0ef8e..444f3cd0de7 100644 --- a/docker/test/keeper-jepsen/run.sh +++ b/docker/test/keeper-jepsen/run.sh @@ -2,7 +2,7 @@ set -euo pipefail -CLICKHOUSE_PACKAGE=${CLICKHOUSE_PACKAGE:="https://clickhouse-builds.s3.amazonaws.com/$PR_TO_TEST/$SHA_TO_TEST/clickhouse_build_check/clang-17_relwithdebuginfo_none_unsplitted_disable_False_binary/clickhouse"} +CLICKHOUSE_PACKAGE=${CLICKHOUSE_PACKAGE:="https://clickhouse-builds.s3.amazonaws.com/$PR_TO_TEST/$SHA_TO_TEST/clickhouse_build_check/clang-18_relwithdebuginfo_none_unsplitted_disable_False_binary/clickhouse"} CLICKHOUSE_REPO_PATH=${CLICKHOUSE_REPO_PATH:=""} diff --git a/docker/test/server-jepsen/run.sh b/docker/test/server-jepsen/run.sh index 81e442e65b6..6ea9c03b954 100644 --- a/docker/test/server-jepsen/run.sh +++ b/docker/test/server-jepsen/run.sh @@ -2,7 +2,7 @@ set -euo pipefail -CLICKHOUSE_PACKAGE=${CLICKHOUSE_PACKAGE:="https://clickhouse-builds.s3.amazonaws.com/$PR_TO_TEST/$SHA_TO_TEST/clickhouse_build_check/clang-17_relwithdebuginfo_none_unsplitted_disable_False_binary/clickhouse"} +CLICKHOUSE_PACKAGE=${CLICKHOUSE_PACKAGE:="https://clickhouse-builds.s3.amazonaws.com/$PR_TO_TEST/$SHA_TO_TEST/clickhouse_build_check/clang-18_relwithdebuginfo_none_unsplitted_disable_False_binary/clickhouse"} CLICKHOUSE_REPO_PATH=${CLICKHOUSE_REPO_PATH:=""} diff --git a/docker/test/sqltest/run.sh b/docker/test/sqltest/run.sh index 1d939805c7b..7edc1341d7d 100755 --- a/docker/test/sqltest/run.sh +++ b/docker/test/sqltest/run.sh @@ -6,7 +6,7 @@ set -e set -u set -o pipefail -BINARY_TO_DOWNLOAD=${BINARY_TO_DOWNLOAD:="clang-17_debug_none_unsplitted_disable_False_binary"} +BINARY_TO_DOWNLOAD=${BINARY_TO_DOWNLOAD:="clang-18_debug_none_unsplitted_disable_False_binary"} BINARY_URL_TO_DOWNLOAD=${BINARY_URL_TO_DOWNLOAD:="https://clickhouse-builds.s3.amazonaws.com/$PR_TO_TEST/$SHA_TO_TEST/clickhouse_build_check/$BINARY_TO_DOWNLOAD/clickhouse"} function wget_with_retry diff --git a/docker/test/util/Dockerfile b/docker/test/util/Dockerfile index 396d5801be9..a5057f024b8 100644 --- a/docker/test/util/Dockerfile +++ b/docker/test/util/Dockerfile @@ -5,7 +5,7 @@ FROM ubuntu:22.04 ARG apt_archive="http://archive.ubuntu.com" RUN sed -i "s|http://archive.ubuntu.com|$apt_archive|g" /etc/apt/sources.list -ENV DEBIAN_FRONTEND=noninteractive LLVM_VERSION=17 +ENV DEBIAN_FRONTEND=noninteractive LLVM_VERSION=18 RUN apt-get update \ && apt-get install \ diff --git a/docs/en/development/build-cross-osx.md b/docs/en/development/build-cross-osx.md index eddf24448c1..66c6e2c6912 100644 --- a/docs/en/development/build-cross-osx.md +++ b/docs/en/development/build-cross-osx.md @@ -13,14 +13,14 @@ The 
cross-build for macOS is based on the [Build instructions](../development/bu The following sections provide a walk-through for building ClickHouse for `x86_64` macOS. If you’re targeting ARM architecture, simply substitute all occurrences of `x86_64` with `aarch64`. For example, replace `x86_64-apple-darwin` with `aarch64-apple-darwin` throughout the steps. -## Install Clang-17 +## Install clang-18 Follow the instructions from https://apt.llvm.org/ for your Ubuntu or Debian setup. For example the commands for Bionic are like: ``` bash sudo echo "deb [trusted=yes] http://apt.llvm.org/bionic/ llvm-toolchain-bionic-17 main" >> /etc/apt/sources.list -sudo apt-get install clang-17 +sudo apt-get install clang-18 ``` ## Install Cross-Compilation Toolset {#install-cross-compilation-toolset} @@ -59,7 +59,7 @@ curl -L 'https://github.com/phracker/MacOSX-SDKs/releases/download/11.3/MacOSX11 cd ClickHouse mkdir build-darwin cd build-darwin -CC=clang-17 CXX=clang++-17 cmake -DCMAKE_AR:FILEPATH=${CCTOOLS}/bin/x86_64-apple-darwin-ar -DCMAKE_INSTALL_NAME_TOOL=${CCTOOLS}/bin/x86_64-apple-darwin-install_name_tool -DCMAKE_RANLIB:FILEPATH=${CCTOOLS}/bin/x86_64-apple-darwin-ranlib -DLINKER_NAME=${CCTOOLS}/bin/x86_64-apple-darwin-ld -DCMAKE_TOOLCHAIN_FILE=cmake/darwin/toolchain-x86_64.cmake .. +CC=clang-18 CXX=clang++-18 cmake -DCMAKE_AR:FILEPATH=${CCTOOLS}/bin/x86_64-apple-darwin-ar -DCMAKE_INSTALL_NAME_TOOL=${CCTOOLS}/bin/x86_64-apple-darwin-install_name_tool -DCMAKE_RANLIB:FILEPATH=${CCTOOLS}/bin/x86_64-apple-darwin-ranlib -DLINKER_NAME=${CCTOOLS}/bin/x86_64-apple-darwin-ld -DCMAKE_TOOLCHAIN_FILE=cmake/darwin/toolchain-x86_64.cmake .. ninja ``` diff --git a/docs/en/development/build-cross-riscv.md b/docs/en/development/build-cross-riscv.md index 9ee5346f258..759d97823e2 100644 --- a/docs/en/development/build-cross-riscv.md +++ b/docs/en/development/build-cross-riscv.md @@ -23,7 +23,7 @@ sudo bash -c "$(wget -O - https://apt.llvm.org/llvm.sh)" ``` bash cd ClickHouse mkdir build-riscv64 -CC=clang-17 CXX=clang++-17 cmake . -Bbuild-riscv64 -G Ninja -DCMAKE_TOOLCHAIN_FILE=cmake/linux/toolchain-riscv64.cmake -DGLIBC_COMPATIBILITY=OFF -DENABLE_LDAP=OFF -DOPENSSL_NO_ASM=ON -DENABLE_JEMALLOC=ON -DENABLE_PARQUET=OFF -DENABLE_GRPC=OFF -DENABLE_HDFS=OFF -DENABLE_MYSQL=OFF +CC=clang-18 CXX=clang++-18 cmake . -Bbuild-riscv64 -G Ninja -DCMAKE_TOOLCHAIN_FILE=cmake/linux/toolchain-riscv64.cmake -DGLIBC_COMPATIBILITY=OFF -DENABLE_LDAP=OFF -DOPENSSL_NO_ASM=ON -DENABLE_JEMALLOC=ON -DENABLE_PARQUET=OFF -DENABLE_GRPC=OFF -DENABLE_HDFS=OFF -DENABLE_MYSQL=OFF ninja -C build-riscv64 ``` diff --git a/docs/en/development/build.md b/docs/en/development/build.md index b474c445604..e4d0fb146ef 100644 --- a/docs/en/development/build.md +++ b/docs/en/development/build.md @@ -67,8 +67,8 @@ to see what version you have installed before setting this environment variable. 
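A quick way to act on that tip, sketched under the assumption that the apt.llvm.org packages are already installed and on `PATH` (these commands are an illustration, not part of the patch):

``` bash
clang-18 --version     # should print "clang version 18.x"
clang++-18 --version
```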
::: ``` bash -export CC=clang-17 -export CXX=clang++-17 +export CC=clang-18 +export CXX=clang++-18 ``` ### Checkout ClickHouse Sources {#checkout-clickhouse-sources} @@ -105,7 +105,7 @@ The build requires the following components: - Git (used to checkout the sources, not needed for the build) - CMake 3.20 or newer -- Compiler: clang-17 or newer +- Compiler: clang-18 or newer - Linker: lld-17 or newer - Ninja - Yasm diff --git a/docs/en/development/continuous-integration.md b/docs/en/development/continuous-integration.md index 46a30f56f11..91253ca5e44 100644 --- a/docs/en/development/continuous-integration.md +++ b/docs/en/development/continuous-integration.md @@ -153,7 +153,7 @@ Builds ClickHouse in various configurations for use in further steps. You have t ### Report Details -- **Compiler**: `clang-17`, optionally with the name of a target platform +- **Compiler**: `clang-18`, optionally with the name of a target platform - **Build type**: `Debug` or `RelWithDebInfo` (cmake). - **Sanitizer**: `none` (without sanitizers), `address` (ASan), `memory` (MSan), `undefined` (UBSan), or `thread` (TSan). - **Status**: `success` or `fail` @@ -177,7 +177,7 @@ Performs static analysis and code style checks using `clang-tidy`. The report is There is a convenience `packager` script that runs the clang-tidy build in docker ```sh mkdir build_tidy -./docker/packager/packager --output-dir=./build_tidy --package-type=binary --compiler=clang-17 --debug-build --clang-tidy +./docker/packager/packager --output-dir=./build_tidy --package-type=binary --compiler=clang-18 --debug-build --clang-tidy ``` diff --git a/docs/en/development/developer-instruction.md b/docs/en/development/developer-instruction.md index e08096d8042..44a5af5911a 100644 --- a/docs/en/development/developer-instruction.md +++ b/docs/en/development/developer-instruction.md @@ -115,7 +115,7 @@ While inside the `build` directory, configure your build by running CMake. Befor export CC=clang CXX=clang++ cmake .. -If you installed clang using the automatic installation script above, also specify the version of clang installed in the first command, e.g. `export CC=clang-17 CXX=clang++-17`. The clang version will be in the script output. +If you installed clang using the automatic installation script above, also specify the version of clang installed in the first command, e.g. `export CC=clang-18 CXX=clang++-18`. The clang version will be in the script output. The `CC` variable specifies the compiler for C (short for C Compiler), and `CXX` variable instructs which C++ compiler is to be used for building. 
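A toolchain bump like this one is a mechanical sweep across workflows, docker scripts, docs and CI config, so it is worth confirming that no reference was left behind. A minimal sketch of such a check, assuming a POSIX shell at the repository root; the path list is illustrative, and hits on `clang-tidy-17` are expected because the clang-tidy lookup keeps older versions as fallbacks:

``` bash
grep -rn 'clang-17' .github/ docker/ docs/ tests/ci/ cmake/
```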
diff --git a/tests/ci/ci_config.py b/tests/ci/ci_config.py index 80994f71280..4757341ce7c 100644 --- a/tests/ci/ci_config.py +++ b/tests/ci/ci_config.py @@ -670,63 +670,63 @@ CI_CONFIG = CIConfig( build_config={ Build.PACKAGE_RELEASE: BuildConfig( name=Build.PACKAGE_RELEASE, - compiler="clang-17", + compiler="clang-18", package_type="deb", static_binary_name="amd64", additional_pkgs=True, ), Build.PACKAGE_AARCH64: BuildConfig( name=Build.PACKAGE_AARCH64, - compiler="clang-17-aarch64", + compiler="clang-18-aarch64", package_type="deb", static_binary_name="aarch64", additional_pkgs=True, ), Build.PACKAGE_ASAN: BuildConfig( name=Build.PACKAGE_ASAN, - compiler="clang-17", + compiler="clang-18", sanitizer="address", package_type="deb", ), Build.PACKAGE_UBSAN: BuildConfig( name=Build.PACKAGE_UBSAN, - compiler="clang-17", + compiler="clang-18", sanitizer="undefined", package_type="deb", ), Build.PACKAGE_TSAN: BuildConfig( name=Build.PACKAGE_TSAN, - compiler="clang-17", + compiler="clang-18", sanitizer="thread", package_type="deb", ), Build.PACKAGE_MSAN: BuildConfig( name=Build.PACKAGE_MSAN, - compiler="clang-17", + compiler="clang-18", sanitizer="memory", package_type="deb", ), Build.PACKAGE_DEBUG: BuildConfig( name=Build.PACKAGE_DEBUG, - compiler="clang-17", + compiler="clang-18", debug_build=True, package_type="deb", sparse_checkout=True, # Check that it works with at least one build, see also update-submodules.sh ), Build.PACKAGE_RELEASE_COVERAGE: BuildConfig( name=Build.PACKAGE_RELEASE_COVERAGE, - compiler="clang-17", + compiler="clang-18", coverage=True, package_type="deb", ), Build.BINARY_RELEASE: BuildConfig( name=Build.BINARY_RELEASE, - compiler="clang-17", + compiler="clang-18", package_type="binary", ), Build.BINARY_TIDY: BuildConfig( name=Build.BINARY_TIDY, - compiler="clang-17", + compiler="clang-18", debug_build=True, package_type="binary", static_binary_name="debug-amd64", @@ -735,69 +735,69 @@ CI_CONFIG = CIConfig( ), Build.BINARY_DARWIN: BuildConfig( name=Build.BINARY_DARWIN, - compiler="clang-17-darwin", + compiler="clang-18-darwin", package_type="binary", static_binary_name="macos", ), Build.BINARY_AARCH64: BuildConfig( name=Build.BINARY_AARCH64, - compiler="clang-17-aarch64", + compiler="clang-18-aarch64", package_type="binary", ), Build.BINARY_AARCH64_V80COMPAT: BuildConfig( name=Build.BINARY_AARCH64_V80COMPAT, - compiler="clang-17-aarch64-v80compat", + compiler="clang-18-aarch64-v80compat", package_type="binary", static_binary_name="aarch64v80compat", comment="For ARMv8.1 and older", ), Build.BINARY_FREEBSD: BuildConfig( name=Build.BINARY_FREEBSD, - compiler="clang-17-freebsd", + compiler="clang-18-freebsd", package_type="binary", static_binary_name="freebsd", ), Build.BINARY_DARWIN_AARCH64: BuildConfig( name=Build.BINARY_DARWIN_AARCH64, - compiler="clang-17-darwin-aarch64", + compiler="clang-18-darwin-aarch64", package_type="binary", static_binary_name="macos-aarch64", ), Build.BINARY_PPC64LE: BuildConfig( name=Build.BINARY_PPC64LE, - compiler="clang-17-ppc64le", + compiler="clang-18-ppc64le", package_type="binary", static_binary_name="powerpc64le", ), Build.BINARY_AMD64_COMPAT: BuildConfig( name=Build.BINARY_AMD64_COMPAT, - compiler="clang-17-amd64-compat", + compiler="clang-18-amd64-compat", package_type="binary", static_binary_name="amd64compat", comment="SSE2-only build", ), Build.BINARY_AMD64_MUSL: BuildConfig( name=Build.BINARY_AMD64_MUSL, - compiler="clang-17-amd64-musl", + compiler="clang-18-amd64-musl", package_type="binary", static_binary_name="amd64musl", 
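            # Aside, not original config text: the musl variant links statically
            # against musl libc, so the binary also runs on glibc-free distributions.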
comment="Build with Musl", ), Build.BINARY_RISCV64: BuildConfig( name=Build.BINARY_RISCV64, - compiler="clang-17-riscv64", + compiler="clang-18-riscv64", package_type="binary", static_binary_name="riscv64", ), Build.BINARY_S390X: BuildConfig( name=Build.BINARY_S390X, - compiler="clang-17-s390x", + compiler="clang-18-s390x", package_type="binary", static_binary_name="s390x", ), Build.FUZZERS: BuildConfig( name=Build.FUZZERS, - compiler="clang-17", + compiler="clang-18", package_type="fuzzers", job_config=JobConfig(run_by_label=Labels.libFuzzer), ), From aaec92f860c92f403c2f79fb9f724102487ed903 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 3 Mar 2024 23:02:55 +0100 Subject: [PATCH 002/289] Address review comments --- cmake/tools.cmake | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cmake/tools.cmake b/cmake/tools.cmake index 1ba3007b0f3..789dc76e6fa 100644 --- a/cmake/tools.cmake +++ b/cmake/tools.cmake @@ -13,7 +13,7 @@ execute_process(COMMAND ${CMAKE_CXX_COMPILER} --version OUTPUT_VARIABLE COMPILER message (STATUS "Using compiler:\n${COMPILER_SELF_IDENTIFICATION}") # Require minimum compiler versions -set (CLANG_MINIMUM_VERSION 16) +set (CLANG_MINIMUM_VERSION 17) set (XCODE_MINIMUM_VERSION 12.0) set (APPLE_CLANG_MINIMUM_VERSION 12.0.0) From 8d25f27b1901d4d4999558b987a415c4c289e2ba Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 3 Mar 2024 23:07:05 +0100 Subject: [PATCH 003/289] Fix UBSan report --- src/Compression/CompressionCodecDoubleDelta.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Compression/CompressionCodecDoubleDelta.cpp b/src/Compression/CompressionCodecDoubleDelta.cpp index 99089ed6770..fe18578eb2a 100644 --- a/src/Compression/CompressionCodecDoubleDelta.cpp +++ b/src/Compression/CompressionCodecDoubleDelta.cpp @@ -343,7 +343,7 @@ UInt32 compressDataForType(const char * source, UInt32 source_size, char * dest) const auto sign = signed_dd < 0; // -1 shrinks dd down to fit into number of bits, and there can't be 0, so it is OK. - const auto abs_value = static_cast(std::abs(signed_dd) - 1); + const auto abs_value = (sign ? -static_cast(signed_dd) : static_cast(signed_dd)) - 1; const auto write_spec = getDeltaWriteSpec(signed_dd); writer.writeBits(write_spec.prefix_bits, write_spec.prefix); From b3a43346b110ecbdbbc9d8c025fee09b4b35e2b6 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 10 Mar 2024 06:59:42 +0100 Subject: [PATCH 004/289] Revert "Fix UBSan report" This reverts commit 8d25f27b1901d4d4999558b987a415c4c289e2ba. --- src/Compression/CompressionCodecDoubleDelta.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Compression/CompressionCodecDoubleDelta.cpp b/src/Compression/CompressionCodecDoubleDelta.cpp index fe18578eb2a..99089ed6770 100644 --- a/src/Compression/CompressionCodecDoubleDelta.cpp +++ b/src/Compression/CompressionCodecDoubleDelta.cpp @@ -343,7 +343,7 @@ UInt32 compressDataForType(const char * source, UInt32 source_size, char * dest) const auto sign = signed_dd < 0; // -1 shrinks dd down to fit into number of bits, and there can't be 0, so it is OK. - const auto abs_value = (sign ? 
-static_cast(signed_dd) : static_cast(signed_dd)) - 1; + const auto abs_value = static_cast(std::abs(signed_dd) - 1); const auto write_spec = getDeltaWriteSpec(signed_dd); writer.writeBits(write_spec.prefix_bits, write_spec.prefix); From 4e8a363b34380a914a326cadff5f9f796837eb70 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 10 Mar 2024 07:32:47 +0100 Subject: [PATCH 005/289] Fix something entirely wrong in DoubleDelta --- src/Compression/CompressionCodecDoubleDelta.cpp | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/src/Compression/CompressionCodecDoubleDelta.cpp b/src/Compression/CompressionCodecDoubleDelta.cpp index 99089ed6770..e6e8db4c699 100644 --- a/src/Compression/CompressionCodecDoubleDelta.cpp +++ b/src/Compression/CompressionCodecDoubleDelta.cpp @@ -343,7 +343,10 @@ UInt32 compressDataForType(const char * source, UInt32 source_size, char * dest) const auto sign = signed_dd < 0; // -1 shrinks dd down to fit into number of bits, and there can't be 0, so it is OK. - const auto abs_value = static_cast(std::abs(signed_dd) - 1); + const auto abs_value = + signed_dd == std::numeric_limits::min() + ? (static_cast(-1) >> 1) + : static_cast(std::abs(signed_dd) - 1); const auto write_spec = getDeltaWriteSpec(signed_dd); writer.writeBits(write_spec.prefix_bits, write_spec.prefix); From 9bb32dc78fa7872cb965d087e64050c091688777 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sat, 9 Mar 2024 09:22:14 +0100 Subject: [PATCH 006/289] Loosen --- CMakeLists.txt | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index b55e9810361..9ffb4789dc9 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -61,8 +61,8 @@ if (ENABLE_CHECK_HEAVY_BUILDS) # set CPU time limit to 1000 seconds set (RLIMIT_CPU 1000) - # -fsanitize=memory is too heavy - if (SANITIZE STREQUAL "memory") + # -fsanitize=memory and address are too heavy + if (SANITIZE) set (RLIMIT_DATA 10000000000) # 10G endif() From 2ff1368678504b3100e7c0f4dc8496e4bfdc9539 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 13 Mar 2024 09:37:17 +0100 Subject: [PATCH 007/289] Fix FreeBSD --- src/Common/waitForPid.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/waitForPid.cpp b/src/Common/waitForPid.cpp index 0ec10811354..894406f69b5 100644 --- a/src/Common/waitForPid.cpp +++ b/src/Common/waitForPid.cpp @@ -144,7 +144,7 @@ static PollPidResult pollPid(pid_t pid, int timeout_in_ms) return PollPidResult::FAILED; } - struct kevent event = {.ident = 0}; + struct kevent event{}; struct timespec remaining_timespec = {.tv_sec = timeout_in_ms / 1000, .tv_nsec = (timeout_in_ms % 1000) * 1000000}; int ready = HANDLE_EINTR(kevent(kq, nullptr, 0, &event, 1, &remaining_timespec)); PollPidResult result = ready < 0 ? 
PollPidResult::FAILED : PollPidResult::RESTART; From 480ae2cd4982fda4fa3f24e494faa8b1848eff59 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 13 Mar 2024 09:39:03 +0100 Subject: [PATCH 008/289] Fix clang-tidy --- cmake/clang_tidy.cmake | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/cmake/clang_tidy.cmake b/cmake/clang_tidy.cmake index 4323c20463a..4c9331f6283 100644 --- a/cmake/clang_tidy.cmake +++ b/cmake/clang_tidy.cmake @@ -5,14 +5,14 @@ if (ENABLE_CLANG_TIDY) find_program (CLANG_TIDY_CACHE_PATH NAMES "clang-tidy-cache") if (CLANG_TIDY_CACHE_PATH) - find_program (_CLANG_TIDY_PATH NAMES "clang-tidy-17" "clang-tidy-16" "clang-tidy") + find_program (_CLANG_TIDY_PATH NAMES "clang-tidy-18" "clang-tidy-17" "clang-tidy-16" "clang-tidy") # Why do we use ';' here? # It's a cmake black magic: https://cmake.org/cmake/help/latest/prop_tgt/LANG_CLANG_TIDY.html#prop_tgt:%3CLANG%3E_CLANG_TIDY # The CLANG_TIDY_PATH is passed to CMAKE_CXX_CLANG_TIDY, which follows CXX_CLANG_TIDY syntax. set (CLANG_TIDY_PATH "${CLANG_TIDY_CACHE_PATH};${_CLANG_TIDY_PATH}" CACHE STRING "A combined command to run clang-tidy with caching wrapper") else () - find_program (CLANG_TIDY_PATH NAMES "clang-tidy-17" "clang-tidy-16" "clang-tidy") + find_program (CLANG_TIDY_PATH NAMES "clang-tidy-18" "clang-tidy-17" "clang-tidy-16" "clang-tidy") endif () if (CLANG_TIDY_PATH) From 6a41dbca0bbaae258ee034e271293479a793df9b Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 14 Mar 2024 13:08:01 +0100 Subject: [PATCH 009/289] Fix Apple's Macintosh OS X 'darwin' --- src/Common/waitForPid.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/waitForPid.cpp b/src/Common/waitForPid.cpp index 894406f69b5..5fb2c62415b 100644 --- a/src/Common/waitForPid.cpp +++ b/src/Common/waitForPid.cpp @@ -132,7 +132,7 @@ static PollPidResult pollPid(pid_t pid, int timeout_in_ms) if (kq == -1) return PollPidResult::FAILED; - struct kevent change = {.ident = 0}; + struct kevent change{}; EV_SET(&change, pid, EVFILT_PROC, EV_ADD, NOTE_EXIT, 0, NULL); int event_add_result = HANDLE_EINTR(kevent(kq, &change, 1, NULL, 0, NULL)); From d03ae0655abaef54117f6455063009aa7aed790b Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 20 Mar 2024 16:39:37 +0800 Subject: [PATCH 010/289] finish opt utf8 version of substring/substringindex/reverse --- src/Common/UTF8Helpers.cpp | 75 +++++++++++++++++++++++++++++++- src/Common/UTF8Helpers.h | 5 ++- src/Functions/reverse.cpp | 38 +--------------- src/Functions/reverse.h | 42 ++++++++++++++++++ src/Functions/reverseUTF8.cpp | 12 ++++- src/Functions/substring.cpp | 18 +++++++- src/Functions/substringIndex.cpp | 20 +++++++-- 7 files changed, 164 insertions(+), 46 deletions(-) create mode 100644 src/Functions/reverse.h diff --git a/src/Common/UTF8Helpers.cpp b/src/Common/UTF8Helpers.cpp index 0af31726f40..78d645994e5 100644 --- a/src/Common/UTF8Helpers.cpp +++ b/src/Common/UTF8Helpers.cpp @@ -1,9 +1,13 @@ -#include #include +#include +#include #include #include +#if USE_MULTITARGET_CODE +#include +#endif namespace DB { @@ -205,5 +209,74 @@ size_t computeBytesBeforeWidth(const UInt8 * data, size_t size, size_t prefix, s return computeWidthImpl(data, size, prefix, limit); } + +DECLARE_DEFAULT_CODE( +bool isAllASCII(const UInt8 * data, size_t size) +{ + UInt8 mask = 0; + for (size_t i = 0; i < size; ++i) + mask |= data[i]; + + return !(mask & 0x80); +}) + +DECLARE_SSE42_SPECIFIC_CODE( +/// Copy from 
https://github.com/lemire/fastvalidate-utf-8/blob/master/include/simdasciicheck.h +bool isAllASCII(const UInt8 * data, size_t size) { + size_t i = 0; + __m128i masks = _mm_setzero_si128(); + if (size >= 16) + { + for (; i <= size - 16; i += 16) + { + __m128i bytes = _mm_loadu_si128(reinterpret_cast(data + i)); + masks = _mm_or_si128(masks, bytes); + } + } + int mask = _mm_movemask_epi8(masks); + + UInt8 tail_mask = 0; + for (; i < size; i++) + tail_mask |= data[i]; + + mask |= (tail_mask & 0x80); + return !mask; +}) + +DECLARE_AVX2_SPECIFIC_CODE( +bool isAllASCII(const UInt8 * data, size_t size) +{ + size_t i = 0; + __m256i masks = _mm256_setzero_si256(); + if (size >= 32) + { + for (; i <= size - 32; i += 32) + { + __m256i bytes = _mm256_loadu_si256(reinterpret_cast(data + i)); + masks = _mm256_or_si256(masks, bytes); + } + } + int mask = _mm256_movemask_epi8(masks); + + UInt8 tail_mask = 0; + for (; i < size; i++) + tail_mask |= data[i]; + + mask |= (tail_mask & 0x80); + return !mask; +}) + +bool isAllASCII(const UInt8* data, size_t size) +{ +#if USE_MULTITARGET_CODE + if (isArchSupported(TargetArch::AVX2)) + return TargetSpecific::AVX2::isAllASCII(data, size); + if (isArchSupported(TargetArch::SSE42)) + return TargetSpecific::SSE42::isAllASCII(data, size); +#endif + return TargetSpecific::Default::isAllASCII(data, size); +} + + } } diff --git a/src/Common/UTF8Helpers.h b/src/Common/UTF8Helpers.h index a4dd88921b7..933b62c7b63 100644 --- a/src/Common/UTF8Helpers.h +++ b/src/Common/UTF8Helpers.h @@ -136,7 +136,10 @@ size_t computeWidth(const UInt8 * data, size_t size, size_t prefix = 0) noexcept */ size_t computeBytesBeforeWidth(const UInt8 * data, size_t size, size_t prefix, size_t limit) noexcept; -} +/// If all the characters in the string are ASCII, return true. +bool isAllASCII(const UInt8* data, size_t size); + +} } diff --git a/src/Functions/reverse.cpp b/src/Functions/reverse.cpp index 32b998523c7..39608b77997 100644 --- a/src/Functions/reverse.cpp +++ b/src/Functions/reverse.cpp @@ -1,10 +1,10 @@ #include -#include #include #include #include #include #include +#include "reverse.h" namespace DB @@ -17,42 +17,6 @@ namespace ErrorCodes namespace { - -/** Reverse the string as a sequence of bytes. - */ -struct ReverseImpl -{ - static void vector(const ColumnString::Chars & data, - const ColumnString::Offsets & offsets, - ColumnString::Chars & res_data, - ColumnString::Offsets & res_offsets) - { - res_data.resize(data.size()); - res_offsets.assign(offsets); - size_t size = offsets.size(); - - ColumnString::Offset prev_offset = 0; - for (size_t i = 0; i < size; ++i) - { - for (size_t j = prev_offset; j < offsets[i] - 1; ++j) - res_data[j] = data[offsets[i] + prev_offset - 2 - j]; - res_data[offsets[i] - 1] = 0; - prev_offset = offsets[i]; - } - } - - static void vectorFixed(const ColumnString::Chars & data, size_t n, ColumnString::Chars & res_data) - { - res_data.resize(data.size()); - size_t size = data.size() / n; - - for (size_t i = 0; i < size; ++i) - for (size_t j = i * n; j < (i + 1) * n; ++j) - res_data[j] = data[(i * 2 + 1) * n - j - 1]; - } -}; - - class FunctionReverse : public IFunction { public: diff --git a/src/Functions/reverse.h b/src/Functions/reverse.h new file mode 100644 index 00000000000..128a897c041 --- /dev/null +++ b/src/Functions/reverse.h @@ -0,0 +1,42 @@ +#pragma once + +#include + +namespace DB +{ + +/** Reverse the string as a sequence of bytes. 
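+  * Note: byte-wise reversal is only safe when every character is one byte wide;
+  * a multi-byte UTF-8 sequence would come out corrupted. That is why the UTF-8
+  * variant (reverseUTF8.cpp, later in this series) dispatches here only after
+  * UTF8::isAllASCII() has confirmed the whole column is plain ASCII.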
+ */ +struct ReverseImpl +{ + static void vector(const ColumnString::Chars & data, + const ColumnString::Offsets & offsets, + ColumnString::Chars & res_data, + ColumnString::Offsets & res_offsets) + { + res_data.resize(data.size()); + res_offsets.assign(offsets); + size_t size = offsets.size(); + + ColumnString::Offset prev_offset = 0; + for (size_t i = 0; i < size; ++i) + { + for (size_t j = prev_offset; j < offsets[i] - 1; ++j) + res_data[j] = data[offsets[i] + prev_offset - 2 - j]; + res_data[offsets[i] - 1] = 0; + prev_offset = offsets[i]; + } + } + + static void vectorFixed(const ColumnString::Chars & data, size_t n, ColumnString::Chars & res_data) + { + res_data.resize(data.size()); + size_t size = data.size() / n; + + for (size_t i = 0; i < size; ++i) + for (size_t j = i * n; j < (i + 1) * n; ++j) + res_data[j] = data[(i * 2 + 1) * n - j - 1]; + } +}; + +} diff --git a/src/Functions/reverseUTF8.cpp b/src/Functions/reverseUTF8.cpp index 8a76af05d86..4ea861919a1 100644 --- a/src/Functions/reverseUTF8.cpp +++ b/src/Functions/reverseUTF8.cpp @@ -1,7 +1,9 @@ -#include #include +#include #include #include +#include +#include "reverse.h" namespace DB @@ -25,10 +27,18 @@ struct ReverseUTF8Impl ColumnString::Chars & res_data, ColumnString::Offsets & res_offsets) { + bool all_ascii = UTF8::isAllASCII(data.data(), data.size()); + if (all_ascii) + { + ReverseImpl::vector(data, offsets, res_data, res_offsets); + return; + } + res_data.resize(data.size()); res_offsets.assign(offsets); size_t size = offsets.size(); + ColumnString::Offset prev_offset = 0; for (size_t i = 0; i < size; ++i) { diff --git a/src/Functions/substring.cpp b/src/Functions/substring.cpp index e809914f5f0..759d41e2ab8 100644 --- a/src/Functions/substring.cpp +++ b/src/Functions/substring.cpp @@ -148,9 +148,23 @@ public: if constexpr (is_utf8) { if (const ColumnString * col = checkAndGetColumn(column_string.get())) - return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, UTF8StringSource(*col), input_rows_count); + { + bool all_ascii = UTF8::isAllASCII(col->getChars().data(), col->getChars().size()); + if (all_ascii) + return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, StringSource(*col), input_rows_count); + else + return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, UTF8StringSource(*col), input_rows_count); + } + if (const ColumnConst * col_const = checkAndGetColumnConst(column_string.get())) - return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, ConstSource(*col_const), input_rows_count); + { + StringRef str_ref = col_const->getDataAt(0); + bool all_ascii = UTF8::isAllASCII(reinterpret_cast(str_ref.data), str_ref.size); + if (all_ascii) + return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, ConstSource(*col_const), input_rows_count); + else + return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, ConstSource(*col_const), input_rows_count); + } throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of first argument of function {}", arguments[0].column->getName(), getName()); } else diff --git a/src/Functions/substringIndex.cpp b/src/Functions/substringIndex.cpp index 5f3f054b624..462941b90ec 100644 --- a/src/Functions/substringIndex.cpp +++ 
b/src/Functions/substringIndex.cpp @@ -129,8 +129,10 @@ namespace res_data.reserve(str_column->getChars().size() / 2); res_offsets.reserve(rows); + bool all_ascii = UTF8::isAllASCII(str_column->getChars().data(), str_column->getChars().size()) + && UTF8::isAllASCII(reinterpret_cast(delim.data()), delim.size()); std::unique_ptr searcher - = !is_utf8 ? nullptr : std::make_unique(delim.data(), delim.size()); + = !is_utf8 || all_ascii ? nullptr : std::make_unique(delim.data(), delim.size()); for (size_t i = 0; i < rows; ++i) { @@ -140,6 +142,8 @@ namespace StringRef res_ref; if constexpr (!is_utf8) res_ref = substringIndex(str_ref, delim[0], count); + else if (all_ascii) + res_ref = substringIndex(str_ref, delim[0], count); else res_ref = substringIndexUTF8(searcher.get(), str_ref, delim, count); @@ -158,8 +162,10 @@ namespace res_data.reserve(str_column->getChars().size() / 2); res_offsets.reserve(rows); + bool all_ascii = UTF8::isAllASCII(str_column->getChars().data(), str_column->getChars().size()) + && UTF8::isAllASCII(reinterpret_cast(delim.data()), delim.size()); std::unique_ptr searcher - = !is_utf8 ? nullptr : std::make_unique(delim.data(), delim.size()); + = !is_utf8 || all_ascii ? nullptr : std::make_unique(delim.data(), delim.size()); for (size_t i = 0; i < rows; ++i) { @@ -168,6 +174,8 @@ namespace StringRef res_ref; if constexpr (!is_utf8) res_ref = substringIndex(str_ref, delim[0], count); + else if (all_ascii) + res_ref = substringIndex(str_ref, delim[0], count); else res_ref = substringIndexUTF8(searcher.get(), str_ref, delim, count); @@ -186,8 +194,10 @@ namespace res_data.reserve(str.size() * rows / 2); res_offsets.reserve(rows); + bool all_ascii = UTF8::isAllASCII(reinterpret_cast(str.data()), str.size()) + && UTF8::isAllASCII(reinterpret_cast(delim.data()), delim.size()); std::unique_ptr searcher - = !is_utf8 ? nullptr : std::make_unique(delim.data(), delim.size()); + = !is_utf8 || all_ascii ? 
nullptr : std::make_unique(delim.data(), delim.size()); StringRef str_ref{str.data(), str.size()}; for (size_t i = 0; i < rows; ++i) @@ -197,6 +207,8 @@ namespace StringRef res_ref; if constexpr (!is_utf8) res_ref = substringIndex(str_ref, delim[0], count); + else if (all_ascii) + res_ref = substringIndex(str_ref, delim[0], count); else res_ref = substringIndexUTF8(searcher.get(), str_ref, delim, count); @@ -208,7 +220,7 @@ namespace { size_t res_offset = res_data.size(); res_data.resize(res_offset + res_ref.size + 1); - memcpy(&res_data[res_offset], res_ref.data, res_ref.size); + memcpySmallAllowReadWriteOverflow15(&res_data[res_offset], res_ref.data, res_ref.size); res_offset += res_ref.size; res_data[res_offset] = 0; ++res_offset; From 75d4cebf7c35ea744816161322f99753bdd65a8c Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 20 Mar 2024 17:20:46 +0800 Subject: [PATCH 011/289] opt lowerUTF8/upperUTF8 --- src/Functions/LowerUpperImpl.h | 4 ++-- src/Functions/LowerUpperUTF8Impl.h | 13 +++++++++++-- 2 files changed, 13 insertions(+), 4 deletions(-) diff --git a/src/Functions/LowerUpperImpl.h b/src/Functions/LowerUpperImpl.h index f093e00f7ab..72b3ce1ca34 100644 --- a/src/Functions/LowerUpperImpl.h +++ b/src/Functions/LowerUpperImpl.h @@ -13,14 +13,14 @@ struct LowerUpperImpl ColumnString::Chars & res_data, ColumnString::Offsets & res_offsets) { - res_data.resize(data.size()); + res_data.resize_exact(data.size()); res_offsets.assign(offsets); array(data.data(), data.data() + data.size(), res_data.data()); } static void vectorFixed(const ColumnString::Chars & data, size_t /*n*/, ColumnString::Chars & res_data) { - res_data.resize(data.size()); + res_data.resize_exact(data.size()); array(data.data(), data.data() + data.size(), res_data.data()); } diff --git a/src/Functions/LowerUpperUTF8Impl.h b/src/Functions/LowerUpperUTF8Impl.h index 460f75f9bde..f2a1351c048 100644 --- a/src/Functions/LowerUpperUTF8Impl.h +++ b/src/Functions/LowerUpperUTF8Impl.h @@ -1,8 +1,9 @@ #pragma once #include +#include +#include #include #include -#include #ifdef __SSE2__ #include @@ -92,7 +93,15 @@ struct LowerUpperUTF8Impl { if (data.empty()) return; - res_data.resize(data.size()); + + bool all_ascii = UTF8::isAllASCII(data.data(), data.size()); + if (all_ascii) + { + LowerUpperImpl::vector(data, offsets, res_data, res_offsets); + return; + } + + res_data.resize_exact(data.size()); res_offsets.assign(offsets); array(data.data(), data.data() + data.size(), offsets, res_data.data()); } From a4466496488d357f6f0049c5906c23893336cad8 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 20 Mar 2024 18:48:51 +0800 Subject: [PATCH 012/289] opt pad string for utf8 --- src/Functions/GatherUtils/Sinks.h | 16 +++++----- src/Functions/GatherUtils/Sources.h | 9 ++++-- src/Functions/padString.cpp | 49 +++++++++++++++++++---------- src/Functions/reverse.h | 4 +-- 4 files changed, 49 insertions(+), 29 deletions(-) diff --git a/src/Functions/GatherUtils/Sinks.h b/src/Functions/GatherUtils/Sinks.h index a8054da1159..2aa7c147136 100644 --- a/src/Functions/GatherUtils/Sinks.h +++ b/src/Functions/GatherUtils/Sinks.h @@ -48,7 +48,7 @@ struct NumericArraySink : public ArraySinkImpl> NumericArraySink(IColumn & elements_, ColumnArray::Offsets & offsets_, size_t column_size) : elements(assert_cast(elements_).getData()), offsets(offsets_) { - offsets.resize(column_size); + offsets.resize_exact(column_size); } void next() @@ -69,7 +69,7 @@ struct NumericArraySink : public ArraySinkImpl> void 
reserve(size_t num_elements) { - elements.reserve(num_elements); + elements.reserve_exact(num_elements); } }; @@ -85,7 +85,7 @@ struct StringSink StringSink(ColumnString & col, size_t column_size) : elements(col.getChars()), offsets(col.getOffsets()) { - offsets.resize(column_size); + offsets.resize_exact(column_size); } void ALWAYS_INLINE next() @@ -108,7 +108,7 @@ struct StringSink void reserve(size_t num_elements) { - elements.reserve(num_elements); + elements.reserve_exact(num_elements); } }; @@ -125,7 +125,7 @@ struct FixedStringSink FixedStringSink(ColumnFixedString & col, size_t column_size) : elements(col.getChars()), string_size(col.getN()), total_rows(column_size) { - elements.resize(column_size * string_size); + elements.resize_exact(column_size * string_size); } void next() @@ -146,7 +146,7 @@ struct FixedStringSink void reserve(size_t num_elements) { - elements.reserve(num_elements); + elements.reserve_exact(num_elements); } }; @@ -165,7 +165,7 @@ struct GenericArraySink : public ArraySinkImpl GenericArraySink(IColumn & elements_, ColumnArray::Offsets & offsets_, size_t column_size) : elements(elements_), offsets(offsets_) { - offsets.resize(column_size); + offsets.resize_exact(column_size); } void next() @@ -210,7 +210,7 @@ struct NullableArraySink : public ArraySink void reserve(size_t num_elements) { ArraySink::reserve(num_elements); - null_map.reserve(num_elements); + null_map.reserve_exact(num_elements); } }; diff --git a/src/Functions/GatherUtils/Sources.h b/src/Functions/GatherUtils/Sources.h index 222f9f19168..41e38e6fa79 100644 --- a/src/Functions/GatherUtils/Sources.h +++ b/src/Functions/GatherUtils/Sources.h @@ -319,6 +319,8 @@ struct StringSource return {&elements[prev_offset], length + elem_size > offset ? std::min(elem_size, length + elem_size - offset) : 0}; return {&elements[prev_offset + elem_size - offset], std::min(length, offset)}; } + + const ColumnString::Chars & getElements() const { return elements; } }; /// Treats Enum values as Strings, modeled after StringSource @@ -513,11 +515,12 @@ struct FixedStringSource const UInt8 * pos; const UInt8 * end; size_t string_size; + const typename ColumnString::Chars & elements; + size_t row_num = 0; size_t column_size = 0; - explicit FixedStringSource(const ColumnFixedString & col) - : string_size(col.getN()) + explicit FixedStringSource(const ColumnFixedString & col) : string_size(col.getN()), elements(col.getChars()) { const auto & chars = col.getChars(); pos = chars.data(); @@ -588,6 +591,8 @@ struct FixedStringSource return {pos, length + string_size > offset ? 
std::min(string_size, length + string_size - offset) : 0}; return {pos + string_size - offset, std::min(length, offset)}; } + + const ColumnString::Chars & getElements() const { return elements; } }; diff --git a/src/Functions/padString.cpp b/src/Functions/padString.cpp index b26a4ec3d6a..7a424bb1198 100644 --- a/src/Functions/padString.cpp +++ b/src/Functions/padString.cpp @@ -211,19 +211,18 @@ namespace pad_string = column_pad_const->getValue(); } - PaddingChars padding_chars{pad_string}; auto col_res = ColumnString::create(); StringSink res_sink{*col_res, input_rows_count}; if (const ColumnString * col = checkAndGetColumn(column_string.get())) - executeForSource(StringSource{*col}, column_length, padding_chars, res_sink); + executeForSource(StringSource{*col}, column_length, pad_string, res_sink); else if (const ColumnFixedString * col_fixed = checkAndGetColumn(column_string.get())) - executeForSource(FixedStringSource{*col_fixed}, column_length, padding_chars, res_sink); + executeForSource(FixedStringSource{*col_fixed}, column_length, pad_string, res_sink); else if (const ColumnConst * col_const = checkAndGetColumnConst(column_string.get())) - executeForSource(ConstSource{*col_const}, column_length, padding_chars, res_sink); + executeForSource(ConstSource{*col_const}, column_length, pad_string, res_sink); else if (const ColumnConst * col_const_fixed = checkAndGetColumnConst(column_string.get())) - executeForSource(ConstSource{*col_const_fixed}, column_length, padding_chars, res_sink); + executeForSource(ConstSource{*col_const_fixed}, column_length, pad_string, res_sink); else throw Exception( ErrorCodes::ILLEGAL_COLUMN, @@ -236,23 +235,39 @@ namespace private: template - void executeForSource( - SourceStrings && strings, - const ColumnPtr & column_length, - const PaddingChars & padding_chars, - StringSink & res_sink) const + void executeForSource(SourceStrings && strings, const ColumnPtr & column_length, const String & pad_string, StringSink & res_sink) const { - if (const auto * col_const = checkAndGetColumn(column_length.get())) - executeForSourceAndLength(std::forward(strings), ConstSource{*col_const}, padding_chars, res_sink); + const auto & chars = strings.getElements(); + bool all_ascii = UTF8::isAllASCII(reinterpret_cast(pad_string.data()), pad_string.size()) + && UTF8::isAllASCII(chars.data(), chars.size()); + + if (all_ascii) + { + PaddingChars padding_chars{pad_string}; + if (const auto * col_const = checkAndGetColumn(column_length.get())) + executeForSourceAndLength( + std::forward(strings), ConstSource{*col_const}, padding_chars, res_sink); + else + executeForSourceAndLength( + std::forward(strings), GenericValueSource{*column_length}, padding_chars, res_sink); + } else - executeForSourceAndLength(std::forward(strings), GenericValueSource{*column_length}, padding_chars, res_sink); + { + PaddingChars padding_chars{pad_string}; + if (const auto * col_const = checkAndGetColumn(column_length.get())) + executeForSourceAndLength( + std::forward(strings), ConstSource{*col_const}, padding_chars, res_sink); + else + executeForSourceAndLength( + std::forward(strings), GenericValueSource{*column_length}, padding_chars, res_sink); + } } - template + template void executeForSourceAndLength( SourceStrings && strings, SourceLengths && lengths, - const PaddingChars & padding_chars, + const PaddingChars & padding_chars, StringSink & res_sink) const { bool is_const_new_length = lengths.isConst(); @@ -264,7 +279,7 @@ namespace for (; !res_sink.isEnd(); res_sink.next(), strings.next(), 
lengths.next()) { auto str = strings.getWhole(); - ssize_t current_length = getLengthOfSlice(str); + ssize_t current_length = getLengthOfSlice(str); if (!res_sink.rowNum() || !is_const_new_length) { @@ -294,7 +309,7 @@ namespace } else if (new_length < current_length) { - str = removeSuffixFromSlice(str, current_length - new_length); + str = removeSuffixFromSlice(str, current_length - new_length); writeSlice(str, res_sink); } else if (new_length > current_length) diff --git a/src/Functions/reverse.h b/src/Functions/reverse.h index 128a897c041..5f999af4297 100644 --- a/src/Functions/reverse.h +++ b/src/Functions/reverse.h @@ -14,7 +14,7 @@ struct ReverseImpl ColumnString::Chars & res_data, ColumnString::Offsets & res_offsets) { - res_data.resize(data.size()); + res_data.resize_exact(data.size()); res_offsets.assign(offsets); size_t size = offsets.size(); @@ -30,7 +30,7 @@ struct ReverseImpl static void vectorFixed(const ColumnString::Chars & data, size_t n, ColumnString::Chars & res_data) { - res_data.resize(data.size()); + res_data.resize_exact(data.size()); size_t size = data.size() / n; for (size_t i = 0; i < size; ++i) From 49422debafbf773c887c60f2affb2e038edea911 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 20 Mar 2024 18:59:22 +0800 Subject: [PATCH 013/289] add perf tests --- src/Common/UTF8Helpers.cpp | 3 ++- tests/performance/ascii.xml | 9 +++++++++ 2 files changed, 11 insertions(+), 1 deletion(-) create mode 100644 tests/performance/ascii.xml diff --git a/src/Common/UTF8Helpers.cpp b/src/Common/UTF8Helpers.cpp index 78d645994e5..6e1c3f5397b 100644 --- a/src/Common/UTF8Helpers.cpp +++ b/src/Common/UTF8Helpers.cpp @@ -222,7 +222,8 @@ bool isAllASCII(const UInt8 * data, size_t size) DECLARE_SSE42_SPECIFIC_CODE( /// Copy from https://github.com/lemire/fastvalidate-utf-8/blob/master/include/simdasciicheck.h -bool isAllASCII(const UInt8 * data, size_t size) { +bool isAllASCII(const UInt8 * data, size_t size) +{ size_t i = 0; __m128i masks = _mm_setzero_si128(); if (size >= 16) diff --git a/tests/performance/ascii.xml b/tests/performance/ascii.xml new file mode 100644 index 00000000000..89c6dd57e07 --- /dev/null +++ b/tests/performance/ascii.xml @@ -0,0 +1,9 @@ + + select substringUTF8(materialize('hello world'), 2, 5) from numbers(10000000) + select substringIndexUTF8(materialize('www.clickhouse.com'), '.', 2) from numbers(10000000) + select reverseUTF8(materialize('hello world')) from numbers(10000000) + select lowerUTF8(materialize('hello world')) from numbers(10000000) + select upperUTF8(materialize('hello world')) from numbers(10000000) + select leftPadUTF8(materialize('hello '), 10, ',') from numbers(10000000) + select rightPadUTF8(materialize('hello '), 10, ',') from numbers(10000000) + From 83645350fb9f3db299061f939659595cefe771ee Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 20 Mar 2024 22:08:15 +0800 Subject: [PATCH 014/289] fix failed uts --- src/Functions/padString.cpp | 2 +- src/Functions/substring.cpp | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/src/Functions/padString.cpp b/src/Functions/padString.cpp index 7a424bb1198..119baaec723 100644 --- a/src/Functions/padString.cpp +++ b/src/Functions/padString.cpp @@ -241,7 +241,7 @@ namespace bool all_ascii = UTF8::isAllASCII(reinterpret_cast(pad_string.data()), pad_string.size()) && UTF8::isAllASCII(chars.data(), chars.size()); - if (all_ascii) + if (!is_utf8 || all_ascii) { PaddingChars padding_chars{pad_string}; if (const auto * col_const = 
checkAndGetColumn(column_length.get())) diff --git a/src/Functions/substring.cpp b/src/Functions/substring.cpp index 759d41e2ab8..122f83d758b 100644 --- a/src/Functions/substring.cpp +++ b/src/Functions/substring.cpp @@ -161,9 +161,9 @@ public: StringRef str_ref = col_const->getDataAt(0); bool all_ascii = UTF8::isAllASCII(reinterpret_cast(str_ref.data), str_ref.size); if (all_ascii) - return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, ConstSource(*col_const), input_rows_count); - else return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, ConstSource(*col_const), input_rows_count); + else + return executeForSource(column_offset, column_length, column_offset_const, column_length_const, offset, length, ConstSource(*col_const), input_rows_count); } throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of first argument of function {}", arguments[0].column->getName(), getName()); } From c350991005253183c83fac4d380b368b343f2763 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Thu, 21 Mar 2024 10:29:35 +0800 Subject: [PATCH 015/289] add more tests --- tests/performance/ascii.xml | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/tests/performance/ascii.xml b/tests/performance/ascii.xml index 89c6dd57e07..83440437d2c 100644 --- a/tests/performance/ascii.xml +++ b/tests/performance/ascii.xml @@ -1,9 +1,22 @@ select substringUTF8(materialize('hello world'), 2, 5) from numbers(10000000) + select substringUTF8(materialize('hello 世界'), 2, 5) from numbers(10000000) + select substringIndexUTF8(materialize('www.clickhouse.com'), '.', 2) from numbers(10000000) + select substringIndexUTF8(materialize('官网www.clickhouse.com'), '.', 2) from numbers(10000000) + select reverseUTF8(materialize('hello world')) from numbers(10000000) + select reverseUTF8(materialize('hello 世界')) from numbers(10000000) + select lowerUTF8(materialize('hello world')) from numbers(10000000) + select lowerUTF8(materialize('hello 世界')) from numbers(10000000) + select upperUTF8(materialize('hello world')) from numbers(10000000) + select upperUTF8(materialize('hello 世界')) from numbers(10000000) + select leftPadUTF8(materialize('hello '), 10, ',') from numbers(10000000) + select leftPadUTF8(materialize('hello '), 10, '世界') from numbers(10000000) + select rightPadUTF8(materialize('hello '), 10, ',') from numbers(10000000) + select rightPadUTF8(materialize('hello '), 10, '世界') from numbers(10000000) From 490a8bc7e48d2d87e67ba8d713a01d0fc78a901d Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Thu, 21 Mar 2024 10:31:45 +0800 Subject: [PATCH 016/289] apply resize_extact for trim --- src/Functions/trim.cpp | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/Functions/trim.cpp b/src/Functions/trim.cpp index dd51c606ff7..8b3d2870260 100644 --- a/src/Functions/trim.cpp +++ b/src/Functions/trim.cpp @@ -46,8 +46,8 @@ public: ColumnString::Offsets & res_offsets) { size_t size = offsets.size(); - res_offsets.resize(size); - res_data.reserve(data.size()); + res_offsets.resize_exact(size); + res_data.reserve_exact(data.size()); size_t prev_offset = 0; size_t res_offset = 0; @@ -59,7 +59,7 @@ public: { execute(reinterpret_cast(&data[prev_offset]), offsets[i] - prev_offset - 1, start, length); - res_data.resize(res_data.size() + length + 1); + res_data.resize_exact(res_data.size() + length + 1); memcpySmallAllowReadWriteOverflow15(&res_data[res_offset], 
start, length); res_offset += length + 1; res_data[res_offset - 1] = '\0'; From ea2fd57cca95d45e4d86260f273abaca67012896 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 24 Mar 2024 00:42:59 +0100 Subject: [PATCH 017/289] Set total_rows_approx for trivial queries with LIMIT from system.zeros and generateRandom --- src/Interpreters/InterpreterSelectQuery.cpp | 3 ++ .../QueryPlan/ReadFromSystemNumbersStep.cpp | 6 +-- .../QueryPlan/ReadFromSystemNumbersStep.h | 2 + src/Storages/StorageGenerateRandom.cpp | 15 ++++-- src/Storages/System/StorageSystemNumbers.cpp | 5 +- src/Storages/System/StorageSystemZeros.cpp | 13 +++-- ...rate_random_with_limit_progress_bar.expect | 49 +++++++++++++++++++ ...e_random_with_limit_progress_bar.reference | 0 ...system_zeros_and_generate_random.reference | 0 ...t_for_system_zeros_and_generate_random.sql | 9 ++++ 10 files changed, 86 insertions(+), 16 deletions(-) create mode 100755 tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect create mode 100644 tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.reference create mode 100644 tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.reference create mode 100644 tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.sql diff --git a/src/Interpreters/InterpreterSelectQuery.cpp b/src/Interpreters/InterpreterSelectQuery.cpp index 7c87dadfce6..fa46b115979 100644 --- a/src/Interpreters/InterpreterSelectQuery.cpp +++ b/src/Interpreters/InterpreterSelectQuery.cpp @@ -2501,10 +2501,13 @@ void InterpreterSelectQuery::executeFetchColumns(QueryProcessingStage::Enum proc max_block_size = std::max(1, max_block_limited); max_threads_execute_query = max_streams = 1; } + if (local_limits.local_limits.size_limits.max_rows != 0) { if (max_block_limited < local_limits.local_limits.size_limits.max_rows) query_info.limit = max_block_limited; + else /// Ask to read just enough rows to make the max_rows limit effective (so it has a chance to be triggered). 
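+                /// Reading exactly max_rows would stop at the boundary and report success;
+                /// max_rows + 1 guarantees the TOO_MANY_ROWS size check can actually fire
+                /// (the 03024 test added in this patch expects exactly that error).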
+ query_info.limit = 1 + local_limits.local_limits.size_limits.max_rows; } else { diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 7a61d09bdd2..11371578c79 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -12,8 +12,8 @@ #include #include #include -#include "Core/Types.h" -#include "base/types.h" +#include + namespace DB { @@ -443,7 +443,6 @@ Pipe ReadFromSystemNumbersStep::makePipe() /// Build rpn of query filters KeyCondition condition(filter_actions_dag, context, column_names, key_expression); - if (condition.extractPlainRanges(ranges)) { /// Intersect ranges with table range @@ -505,7 +504,6 @@ Pipe ReadFromSystemNumbersStep::makePipe() } } - /// ranges is blank, return a source who has no data if (intersected_ranges.empty()) { diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.h b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.h index cab0686474b..bc84e31be62 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.h +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.h @@ -8,6 +8,7 @@ #include #include + namespace DB { @@ -43,4 +44,5 @@ private: UInt64 limit; std::shared_ptr storage_limits; }; + } diff --git a/src/Storages/StorageGenerateRandom.cpp b/src/Storages/StorageGenerateRandom.cpp index fbce6c2bb7d..cdbade51695 100644 --- a/src/Storages/StorageGenerateRandom.cpp +++ b/src/Storages/StorageGenerateRandom.cpp @@ -3,6 +3,7 @@ #include #include #include +#include #include #include #include @@ -30,12 +31,9 @@ #include #include #include -#include #include -#include - namespace DB { @@ -639,7 +637,7 @@ void registerStorageGenerateRandom(StorageFactory & factory) Pipe StorageGenerateRandom::read( const Names & column_names, const StorageSnapshotPtr & storage_snapshot, - SelectQueryInfo & /*query_info*/, + SelectQueryInfo & query_info, ContextPtr context, QueryProcessingStage::Enum /*processed_stage*/, size_t max_block_size, @@ -682,7 +680,14 @@ Pipe StorageGenerateRandom::read( pcg64 generate(random_seed); for (UInt64 i = 0; i < num_streams; ++i) - pipes.emplace_back(std::make_shared(max_block_size, max_array_length, max_string_length, generate(), block_header, context)); + { + auto source = std::make_shared(max_block_size, max_array_length, max_string_length, generate(), block_header, context); + + if (i == 0 && query_info.limit) + source->addTotalRowsApprox(query_info.limit); + + pipes.emplace_back(std::move(source)); + } return Pipe::unitePipes(std::move(pipes)); } diff --git a/src/Storages/System/StorageSystemNumbers.cpp b/src/Storages/System/StorageSystemNumbers.cpp index 629b11ee7f1..da700a7a4e9 100644 --- a/src/Storages/System/StorageSystemNumbers.cpp +++ b/src/Storages/System/StorageSystemNumbers.cpp @@ -1,17 +1,14 @@ #include #include -#include #include #include -#include #include #include #include -#include -#include #include + namespace DB { diff --git a/src/Storages/System/StorageSystemZeros.cpp b/src/Storages/System/StorageSystemZeros.cpp index ce2e153ea66..a48b109fbbe 100644 --- a/src/Storages/System/StorageSystemZeros.cpp +++ b/src/Storages/System/StorageSystemZeros.cpp @@ -1,4 +1,5 @@ #include +#include #include #include @@ -6,6 +7,7 @@ #include #include + namespace DB { @@ -93,7 +95,7 @@ StorageSystemZeros::StorageSystemZeros(const StorageID & table_id_, bool multith Pipe StorageSystemZeros::read( const Names & column_names, const StorageSnapshotPtr & storage_snapshot, - 
SelectQueryInfo &, + SelectQueryInfo & query_info, ContextPtr /*context*/, QueryProcessingStage::Enum /*processed_stage*/, size_t max_block_size, @@ -123,8 +125,13 @@ Pipe StorageSystemZeros::read( { auto source = std::make_shared(max_block_size, limit ? *limit : 0, state); - if (limit && i == 0) - source->addTotalRowsApprox(*limit); + if (i == 0) + { + if (limit) + source->addTotalRowsApprox(*limit); + else if (query_info.limit) + source->addTotalRowsApprox(query_info.limit); + } res.addSource(std::move(source)); } diff --git a/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect b/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect new file mode 100755 index 00000000000..272dc0fdfef --- /dev/null +++ b/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect @@ -0,0 +1,49 @@ +#!/usr/bin/expect -f + +set basedir [file dirname $argv0] +set basename [file tail $argv0] +if {[info exists env(CLICKHOUSE_TMP)]} { + set CLICKHOUSE_TMP $env(CLICKHOUSE_TMP) +} else { + set CLICKHOUSE_TMP "." +} +exp_internal -f $CLICKHOUSE_TMP/$basename.debuglog 0 + +log_user 0 +set timeout 60 +match_max 100000 +set stty_init "rows 25 cols 120" + +expect_after { + -i $any_spawn_id eof { exp_continue } + -i $any_spawn_id timeout { exit 1 } +} + +spawn clickhouse-local +expect ":) " + +# Trivial SELECT with LIMIT from system.zeros shows progress bar. +send "SELECT * FROM system.zeros LIMIT 1e11 FORMAT Null\r" +expect "Progress: " +expect "█" +send "\3" +expect "Query was cancelled." +expect ":) " + +send "SELECT * FROM system.zeros_mt LIMIT 1e11 FORMAT Null\r" +expect "Progress: " +expect "█" +send "\3" +expect "Query was cancelled." +expect ":) " + +# As well as from generateRandom +send "SELECT * FROM generateRandom() LIMIT 1e9 FORMAT Null\r" +expect "Progress: " +expect "█" +send "\3" +expect "Query was cancelled." 
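As an aside before the test script continues: the storage changes above are what make a progress bar possible here — the first stream announces an approximate row total. A toy standalone model of that logic (the types and driver are invented for illustration; only `addTotalRowsApprox` mirrors the real method name):

```cpp
#include <cassert>
#include <cstdint>

// Toy model, not ClickHouse code: a source that knows an approximate row total
// lets the client render progress as rows_read / total.
struct ToySource
{
    uint64_t total_rows_approx = 0;
    void addTotalRowsApprox(uint64_t rows) { total_rows_approx += rows; }
};

int main()
{
    uint64_t storage_limit = 0;       // system.zeros itself is unbounded
    uint64_t query_limit = 10000000;  // pushed down from "LIMIT 10000000"

    ToySource first_stream;
    // Same priority as in StorageSystemZeros::read above: a storage-level limit
    // wins; otherwise fall back to the limit pushed down from the query.
    if (storage_limit)
        first_stream.addTotalRowsApprox(storage_limit);
    else if (query_limit)
        first_stream.addTotalRowsApprox(query_limit);

    uint64_t rows_read = 2500000;
    double progress = double(rows_read) / double(first_stream.total_rows_approx);
    assert(progress == 0.25);  // enough information to draw a progress bar
}
```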
+expect ":) " + +send "exit\r" +expect eof diff --git a/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.reference b/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.reference b/tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.sql b/tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.sql new file mode 100644 index 00000000000..0db09ead2cd --- /dev/null +++ b/tests/queries/0_stateless/03024_total_rows_approx_is_set_for_system_zeros_and_generate_random.sql @@ -0,0 +1,9 @@ +SET max_rows_to_read = 1e11; + +SELECT * FROM system.numbers LIMIT 1e12 FORMAT Null; -- { serverError TOO_MANY_ROWS } +SELECT * FROM system.numbers_mt LIMIT 1e12 FORMAT Null; -- { serverError TOO_MANY_ROWS } + +SELECT * FROM system.zeros LIMIT 1e12 FORMAT Null; -- { serverError TOO_MANY_ROWS } +SELECT * FROM system.zeros_mt LIMIT 1e12 FORMAT Null; -- { serverError TOO_MANY_ROWS } + +SELECT * FROM generateRandom() LIMIT 1e12 FORMAT Null; -- { serverError TOO_MANY_ROWS } From 86039802e3327c0a527135233f3589d6bcea2348 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 24 Mar 2024 00:46:48 +0100 Subject: [PATCH 018/289] Set total_rows_approx for trivial queries with LIMIT from system.zeros and generateRandom --- src/Interpreters/InterpreterSelectQuery.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Interpreters/InterpreterSelectQuery.cpp b/src/Interpreters/InterpreterSelectQuery.cpp index fa46b115979..65beef27d16 100644 --- a/src/Interpreters/InterpreterSelectQuery.cpp +++ b/src/Interpreters/InterpreterSelectQuery.cpp @@ -2506,7 +2506,7 @@ void InterpreterSelectQuery::executeFetchColumns(QueryProcessingStage::Enum proc { if (max_block_limited < local_limits.local_limits.size_limits.max_rows) query_info.limit = max_block_limited; - else /// Ask to read just enough rows to make the max_rows limit effective (so it has a chance to be triggered). + else if (local_limits.local_limits.size_limits.max_rows < std::numeric_limits::max()) /// Ask to read just enough rows to make the max_rows limit effective (so it has a chance to be triggered). query_info.limit = 1 + local_limits.local_limits.size_limits.max_rows; } else From c55e45bff6212e8e4828198fd13a56bc174d2062 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 24 Mar 2024 18:58:57 +0100 Subject: [PATCH 019/289] Test robustness --- ...023_zeros_generate_random_with_limit_progress_bar.expect | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect b/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect index 272dc0fdfef..de15a199132 100755 --- a/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect +++ b/tests/queries/0_stateless/03023_zeros_generate_random_with_limit_progress_bar.expect @@ -23,14 +23,14 @@ spawn clickhouse-local expect ":) " # Trivial SELECT with LIMIT from system.zeros shows progress bar. 
-send "SELECT * FROM system.zeros LIMIT 1e11 FORMAT Null\r" +send "SELECT * FROM system.zeros LIMIT 10000000 FORMAT Null SETTINGS max_execution_speed = 1000000, timeout_before_checking_execution_speed = 0, max_block_size = 128\r" expect "Progress: " expect "█" send "\3" expect "Query was cancelled." expect ":) " -send "SELECT * FROM system.zeros_mt LIMIT 1e11 FORMAT Null\r" +send "SELECT * FROM system.zeros_mt LIMIT 10000000 FORMAT Null SETTINGS max_execution_speed = 1000000, timeout_before_checking_execution_speed = 0, max_block_size = 128\r" expect "Progress: " expect "█" send "\3" @@ -38,7 +38,7 @@ expect "Query was cancelled." expect ":) " # As well as from generateRandom -send "SELECT * FROM generateRandom() LIMIT 1e9 FORMAT Null\r" +send "SELECT * FROM generateRandom() LIMIT 10000000 FORMAT Null SETTINGS max_execution_speed = 1000000, timeout_before_checking_execution_speed = 0, max_block_size = 128\r" expect "Progress: " expect "█" send "\3" From 98c2048d30d0a6e324875c98a4f138e7ee92734a Mon Sep 17 00:00:00 2001 From: zvonand Date: Sun, 31 Mar 2024 22:12:03 +0200 Subject: [PATCH 020/289] try to improve Storage S3 selection glob performance --- src/Storages/StorageS3.cpp | 122 +++++++++++++++++++++++++++++-------- 1 file changed, 98 insertions(+), 24 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 2d3aef312bf..cee9f11af95 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -210,32 +210,36 @@ public: if (globbed_uri.bucket.find_first_of("*?{") != globbed_uri.bucket.npos) throw Exception(ErrorCodes::UNEXPECTED_EXPRESSION, "Expression can not have wildcards inside bucket name"); - const String key_prefix = globbed_uri.key.substr(0, globbed_uri.key.find_first_of("*?{")); - - /// We don't have to list bucket, because there is no asterisks. - if (key_prefix.size() == globbed_uri.key.size()) + for (const auto & key : expandSelectionGlob(globbed_uri.key)) { - buffer.emplace_back(std::make_shared(globbed_uri.key, std::nullopt)); - buffer_iter = buffer.begin(); - is_finished = true; - return; + const String key_prefix = key.substr(0, key.find_first_of("*?{")); + + /// We don't have to list bucket, because there is no asterisks. + if (key_prefix.size() == key.size()) + { + buffer.emplace_back(std::make_shared(key, std::nullopt)); + buffer_iter = buffer.begin(); + is_finished = true; + return; + } + + request.SetBucket(globbed_uri.bucket); + request.SetPrefix(key_prefix); + request.SetMaxKeys(static_cast(request_settings.list_object_keys_size)); + + outcome_future = listObjectsAsync(); + + matcher = std::make_unique(makeRegexpPatternFromGlobs(key)); + if (!matcher->ok()) + throw Exception( + ErrorCodes::CANNOT_COMPILE_REGEXP, "Cannot compile regex from glob ({}): {}", key, matcher->error()); + + recursive = key == "/**"; + + filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns); + updateInternalBufferAssumeLocked(); } - - request.SetBucket(globbed_uri.bucket); - request.SetPrefix(key_prefix); - request.SetMaxKeys(static_cast(request_settings.list_object_keys_size)); - - outcome_future = listObjectsAsync(); - - matcher = std::make_unique(makeRegexpPatternFromGlobs(globbed_uri.key)); - if (!matcher->ok()) - throw Exception(ErrorCodes::CANNOT_COMPILE_REGEXP, - "Cannot compile regex from glob ({}): {}", globbed_uri.key, matcher->error()); - - recursive = globbed_uri.key == "/**" ? 
true : false; - - filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns); - fillInternalBufferAssumeLocked(); + buffer_iter = buffer.begin(); } KeyWithInfoPtr next(size_t) @@ -301,6 +305,76 @@ private: } while (true); } + void updateInternalBufferAssumeLocked() + { + assert(outcome_future.valid()); + auto outcome = outcome_future.get(); + + if (!outcome.IsSuccess()) + { + throw S3Exception(outcome.GetError().GetErrorType(), "Could not list objects in bucket {} with prefix {}, S3 exception: {}, message: {}", + quoteString(request.GetBucket()), quoteString(request.GetPrefix()), + backQuote(outcome.GetError().GetExceptionName()), quoteString(outcome.GetError().GetMessage())); + } + + const auto & result_batch = outcome.GetResult().GetContents(); + + /// It returns false when all objects were returned + is_finished = !outcome.GetResult().GetIsTruncated(); + + if (!is_finished) + { + /// Even if task is finished the thread may be not freed in pool. + /// So wait until it will be freed before scheduling a new task. + list_objects_pool.wait(); + outcome_future = listObjectsAsync(); + } + + if (request_settings.throw_on_zero_files_match && result_batch.empty()) + throw Exception(ErrorCodes::FILE_DOESNT_EXIST, "Can not match any files using prefix {}", request.GetPrefix()); + + KeysWithInfo temp_buffer; + temp_buffer.reserve(result_batch.size()); + + for (const auto & row : result_batch) + { + String key = row.GetKey(); + if (recursive || re2::RE2::FullMatch(key, *matcher)) + { + S3::ObjectInfo info = + { + .size = size_t(row.GetSize()), + .last_modification_time = row.GetLastModified().Millis() / 1000, + }; + temp_buffer.emplace_back(std::make_shared(std::move(key), std::move(info))); + } + } + + if (temp_buffer.empty()) + return; + + if (filter_dag) + { + std::vector paths; + paths.reserve(temp_buffer.size()); + for (const auto & key_with_info : temp_buffer) + paths.push_back(fs::path(globbed_uri.bucket) / key_with_info->key); + + VirtualColumnUtils::filterByPathOrFile(temp_buffer, paths, filter_dag, virtual_columns, getContext()); + } + + buffer.insert(buffer.end(), temp_buffer.begin(), temp_buffer.end()); + + if (read_keys) + read_keys->insert(read_keys->end(), temp_buffer.begin(), temp_buffer.end()); + + if (file_progress_callback) + { + for (const auto & key_with_info : buffer) + file_progress_callback(FileProgress(0, key_with_info->info->size)); + } + } + void fillInternalBufferAssumeLocked() { buffer.clear(); From 73b9ef99f4315e89d6f184d836e01da4345151ba Mon Sep 17 00:00:00 2001 From: zvonand Date: Mon, 1 Apr 2024 17:40:40 +0200 Subject: [PATCH 021/289] Revert "try to improve Storage S3 selection glob performance" This reverts commit 9c9421b6897bf4a95346cef52171839ef67bd522. --- src/Storages/StorageS3.cpp | 122 ++++++++----------------------------- 1 file changed, 24 insertions(+), 98 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index cee9f11af95..2d3aef312bf 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -210,36 +210,32 @@ public: if (globbed_uri.bucket.find_first_of("*?{") != globbed_uri.bucket.npos) throw Exception(ErrorCodes::UNEXPECTED_EXPRESSION, "Expression can not have wildcards inside bucket name"); - for (const auto & key : expandSelectionGlob(globbed_uri.key)) + const String key_prefix = globbed_uri.key.substr(0, globbed_uri.key.find_first_of("*?{")); + + /// We don't have to list bucket, because there is no asterisks. 
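As an aside, the restored constructor above follows a simple rule: everything before the first glob character becomes a literal S3 listing prefix, and a key with no glob characters needs no listing at all. A minimal standalone sketch of that rule (the `ListingPlan` type is invented for illustration; only the `find_first_of("*?{")` logic comes from the code above):

```cpp
#include <cassert>
#include <string>

struct ListingPlan
{
    std::string prefix;       // would be passed to ListObjectsV2 as the Prefix
    bool single_key = false;  // no listing needed at all
};

// Everything before the first glob character can be used as a literal prefix;
// if there is no glob character, the key itself is the single object to read.
ListingPlan planListing(const std::string & key)
{
    const size_t first_glob = key.find_first_of("*?{");
    if (first_glob == std::string::npos)
        return {key, true};
    return {key.substr(0, first_glob), false};
}

int main()
{
    assert(planListing("data/2024/part.csv").single_key);
    assert(planListing("data/2024/*.csv").prefix == "data/2024/");
}
```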
+ if (key_prefix.size() == globbed_uri.key.size()) { - const String key_prefix = key.substr(0, key.find_first_of("*?{")); - - /// We don't have to list bucket, because there is no asterisks. - if (key_prefix.size() == key.size()) - { - buffer.emplace_back(std::make_shared(key, std::nullopt)); - buffer_iter = buffer.begin(); - is_finished = true; - return; - } - - request.SetBucket(globbed_uri.bucket); - request.SetPrefix(key_prefix); - request.SetMaxKeys(static_cast(request_settings.list_object_keys_size)); - - outcome_future = listObjectsAsync(); - - matcher = std::make_unique(makeRegexpPatternFromGlobs(key)); - if (!matcher->ok()) - throw Exception( - ErrorCodes::CANNOT_COMPILE_REGEXP, "Cannot compile regex from glob ({}): {}", key, matcher->error()); - - recursive = key == "/**"; - - filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns); - updateInternalBufferAssumeLocked(); + buffer.emplace_back(std::make_shared(globbed_uri.key, std::nullopt)); + buffer_iter = buffer.begin(); + is_finished = true; + return; } - buffer_iter = buffer.begin(); + + request.SetBucket(globbed_uri.bucket); + request.SetPrefix(key_prefix); + request.SetMaxKeys(static_cast(request_settings.list_object_keys_size)); + + outcome_future = listObjectsAsync(); + + matcher = std::make_unique(makeRegexpPatternFromGlobs(globbed_uri.key)); + if (!matcher->ok()) + throw Exception(ErrorCodes::CANNOT_COMPILE_REGEXP, + "Cannot compile regex from glob ({}): {}", globbed_uri.key, matcher->error()); + + recursive = globbed_uri.key == "/**" ? true : false; + + filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns); + fillInternalBufferAssumeLocked(); } KeyWithInfoPtr next(size_t) @@ -305,76 +301,6 @@ private: } while (true); } - void updateInternalBufferAssumeLocked() - { - assert(outcome_future.valid()); - auto outcome = outcome_future.get(); - - if (!outcome.IsSuccess()) - { - throw S3Exception(outcome.GetError().GetErrorType(), "Could not list objects in bucket {} with prefix {}, S3 exception: {}, message: {}", - quoteString(request.GetBucket()), quoteString(request.GetPrefix()), - backQuote(outcome.GetError().GetExceptionName()), quoteString(outcome.GetError().GetMessage())); - } - - const auto & result_batch = outcome.GetResult().GetContents(); - - /// It returns false when all objects were returned - is_finished = !outcome.GetResult().GetIsTruncated(); - - if (!is_finished) - { - /// Even if task is finished the thread may be not freed in pool. - /// So wait until it will be freed before scheduling a new task. 
- list_objects_pool.wait(); - outcome_future = listObjectsAsync(); - } - - if (request_settings.throw_on_zero_files_match && result_batch.empty()) - throw Exception(ErrorCodes::FILE_DOESNT_EXIST, "Can not match any files using prefix {}", request.GetPrefix()); - - KeysWithInfo temp_buffer; - temp_buffer.reserve(result_batch.size()); - - for (const auto & row : result_batch) - { - String key = row.GetKey(); - if (recursive || re2::RE2::FullMatch(key, *matcher)) - { - S3::ObjectInfo info = - { - .size = size_t(row.GetSize()), - .last_modification_time = row.GetLastModified().Millis() / 1000, - }; - temp_buffer.emplace_back(std::make_shared(std::move(key), std::move(info))); - } - } - - if (temp_buffer.empty()) - return; - - if (filter_dag) - { - std::vector paths; - paths.reserve(temp_buffer.size()); - for (const auto & key_with_info : temp_buffer) - paths.push_back(fs::path(globbed_uri.bucket) / key_with_info->key); - - VirtualColumnUtils::filterByPathOrFile(temp_buffer, paths, filter_dag, virtual_columns, getContext()); - } - - buffer.insert(buffer.end(), temp_buffer.begin(), temp_buffer.end()); - - if (read_keys) - read_keys->insert(read_keys->end(), temp_buffer.begin(), temp_buffer.end()); - - if (file_progress_callback) - { - for (const auto & key_with_info : buffer) - file_progress_callback(FileProgress(0, key_with_info->info->size)); - } - } - void fillInternalBufferAssumeLocked() { buffer.clear(); From 70da13b9b01d0e9a86b313bdcf165b6c54a4b985 Mon Sep 17 00:00:00 2001 From: zvonand Date: Mon, 1 Apr 2024 22:34:54 +0200 Subject: [PATCH 022/289] simpler way --- src/Storages/StorageS3.cpp | 76 +++++++++++++++++++++++++------------- 1 file changed, 51 insertions(+), 25 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 2d3aef312bf..844f5362ec2 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -191,7 +191,7 @@ public: Impl( const S3::Client & client_, const S3::URI & globbed_uri_, - const ActionsDAG::Node * predicate, + const ActionsDAG::Node * predicate_, const NamesAndTypesList & virtual_columns_, ContextPtr context_, KeysWithInfo * read_keys_, @@ -200,6 +200,7 @@ public: : WithContext(context_) , client(client_.clone()) , globbed_uri(globbed_uri_) + , predicate(predicate_) , virtual_columns(virtual_columns_) , read_keys(read_keys_) , request_settings(request_settings_) @@ -210,32 +211,13 @@ public: if (globbed_uri.bucket.find_first_of("*?{") != globbed_uri.bucket.npos) throw Exception(ErrorCodes::UNEXPECTED_EXPRESSION, "Expression can not have wildcards inside bucket name"); - const String key_prefix = globbed_uri.key.substr(0, globbed_uri.key.find_first_of("*?{")); + expanded_keys = expandSelectionGlob(globbed_uri.key); + expanded_keys_iter = expanded_keys.begin(); - /// We don't have to list bucket, because there is no asterisks. 
-        if (key_prefix.size() == globbed_uri.key.size())
-        {
-            buffer.emplace_back(std::make_shared(globbed_uri.key, std::nullopt));
-            buffer_iter = buffer.begin();
+        bool no_globs_in_key = fillBufferForKey(*expanded_keys_iter);
+        expanded_keys_iter++;
+        if (expanded_keys_iter == expanded_keys.end() && no_globs_in_key)
             is_finished = true;
-            return;
-        }
-
-        request.SetBucket(globbed_uri.bucket);
-        request.SetPrefix(key_prefix);
-        request.SetMaxKeys(static_cast(request_settings.list_object_keys_size));
-
-        outcome_future = listObjectsAsync();
-
-        matcher = std::make_unique(makeRegexpPatternFromGlobs(globbed_uri.key));
-        if (!matcher->ok())
-            throw Exception(ErrorCodes::CANNOT_COMPILE_REGEXP,
-                "Cannot compile regex from glob ({}): {}", globbed_uri.key, matcher->error());
-
-        recursive = globbed_uri.key == "/**" ? true : false;
-
-        filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns);
-        fillInternalBufferAssumeLocked();
     }
 
     KeyWithInfoPtr next(size_t)
@@ -257,6 +239,37 @@ public:
 private:
     using ListObjectsOutcome = Aws::S3::Model::ListObjectsV2Outcome;
 
+    bool fillBufferForKey(const std::string & uri_key)
+    {
+        const String key_prefix = uri_key.substr(0, uri_key.find_first_of("*?{"));
+
+        /// We don't have to list bucket, because there is no asterisks.
+        if (key_prefix.size() == uri_key.size())
+        {
+            buffer.clear();
+            buffer.emplace_back(std::make_shared(uri_key, std::nullopt));
+            buffer_iter = buffer.begin();
+            return true;
+        }
+
+        request.SetBucket(globbed_uri.bucket);
+        request.SetPrefix(key_prefix);
+        request.SetMaxKeys(static_cast(request_settings.list_object_keys_size));
+
+        outcome_future = listObjectsAsync();
+
+        matcher = std::make_unique(makeRegexpPatternFromGlobs(uri_key));
+        if (!matcher->ok())
+            throw Exception(ErrorCodes::CANNOT_COMPILE_REGEXP,
+                "Cannot compile regex from glob ({}): {}", uri_key, matcher->error());
+
+        recursive = globbed_uri.key == "/**";
+
+        filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns);
+        fillInternalBufferAssumeLocked();
+        return false;
+    }
+
     KeyWithInfoPtr nextAssumeLocked()
     {
         do
@@ -278,6 +291,15 @@ private:
                 return answer;
             }
 
+            if (expanded_keys_iter != expanded_keys.end())
+            {
+                bool no_globs_in_key = fillBufferForKey(*expanded_keys_iter);
+                expanded_keys_iter++;
+                if (expanded_keys_iter == expanded_keys.end() && no_globs_in_key)
+                    is_finished = true;
+                continue;
+            }
+
             if (is_finished)
                 return {};
 
@@ -399,8 +421,12 @@ private:
     KeysWithInfo buffer;
     KeysWithInfo::iterator buffer_iter;
 
+    std::vector expanded_keys;
+    std::vector::iterator expanded_keys_iter;
+
    std::unique_ptr client;
     S3::URI globbed_uri;
+    const ActionsDAG::Node * predicate;
     ASTPtr query;
     NamesAndTypesList virtual_columns;
     ActionsDAGPtr filter_dag;

From a177fbfd8cb52c64f096797a6c65fdc4dfeb828e Mon Sep 17 00:00:00 2001
From: zvonand
Date: Tue, 2 Apr 2024 00:05:53 +0200
Subject: [PATCH 023/289] ignore error when one of the selection options does
 not exist

---
 src/Storages/StorageS3.cpp | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp
index 844f5362ec2..09a5ffc86a5 100644
--- a/src/Storages/StorageS3.cpp
+++ b/src/Storages/StorageS3.cpp
@@ -283,7 +283,18 @@ private:
         /// So we get object info lazily here on 'next()' request.
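Before the hunk body continues, an aside on the helper the new code path iterates over: only the call site of `expandSelectionGlob(...)` appears in these patches, so the following is a from-scratch sketch of what such an expansion does — a simplified stand-in that handles a single, non-nested `{a,b}` group, not the actual ClickHouse helper:

```cpp
#include <cassert>
#include <string>
#include <vector>

// Standalone illustration of "selection glob" expansion: "a{x,y}b" -> {"axb", "ayb"}.
// Simplified: expands only the first brace group and ignores nesting.
std::vector<std::string> expandSelectionGlob(const std::string & key)
{
    const auto open = key.find('{');
    const auto close = key.find('}', open);
    if (open == std::string::npos || close == std::string::npos)
        return {key};

    std::vector<std::string> result;
    const std::string prefix = key.substr(0, open);
    const std::string suffix = key.substr(close + 1);
    const std::string body = key.substr(open + 1, close - open - 1);

    size_t start = 0;
    while (true)
    {
        const size_t comma = body.find(',', start);
        result.push_back(prefix + body.substr(start, comma - start) + suffix);
        if (comma == std::string::npos)
            break;
        start = comma + 1;
    }
    return result;
}

int main()
{
    auto keys = expandSelectionGlob("dir/{a,b}/*.csv");
    assert(keys.size() == 2 && keys[0] == "dir/a/*.csv" && keys[1] == "dir/b/*.csv");
}
```

With that expansion in mind, the per-key error handling below makes sense: a missing file is fatal only when there was no `{}` group, i.e. when exactly one key was expanded.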
if (!answer->info) { - answer->info = S3::getObjectInfo(*client, globbed_uri.bucket, answer->key, globbed_uri.version_id, request_settings); + try + { + answer->info = S3::getObjectInfo(*client, globbed_uri.bucket, answer->key, globbed_uri.version_id, request_settings); + } + catch (...) + { + /// if no such file AND there was no `{}` glob -- this is an exception + /// otherwise ignore it, this is acceptable + if (expanded_keys.size() == 1) + throw; + continue; + } if (file_progress_callback) file_progress_callback(FileProgress(0, answer->info->size)); } From 5f190e6774aa1a38e6aae740b97f51882355cd25 Mon Sep 17 00:00:00 2001 From: serxa Date: Tue, 2 Apr 2024 11:12:34 +0000 Subject: [PATCH 024/289] Use intrusive lists for `ResourceRequest` instead of deque --- src/Common/Scheduler/Nodes/FifoQueue.h | 39 +++++++++++++++----------- src/Common/Scheduler/ResourceRequest.h | 4 ++- 2 files changed, 26 insertions(+), 17 deletions(-) diff --git a/src/Common/Scheduler/Nodes/FifoQueue.h b/src/Common/Scheduler/Nodes/FifoQueue.h index 45ed32343ff..9ec997c06d2 100644 --- a/src/Common/Scheduler/Nodes/FifoQueue.h +++ b/src/Common/Scheduler/Nodes/FifoQueue.h @@ -6,7 +6,8 @@ #include -#include +#include + #include @@ -15,6 +16,7 @@ namespace DB namespace ErrorCodes { + extern const int LOGICAL_ERROR; extern const int INVALID_SCHEDULER_NODE; } @@ -42,7 +44,7 @@ public: std::lock_guard lock(mutex); queue_cost += request->cost; bool was_empty = requests.empty(); - requests.push_back(request); + requests.push_back(*request); if (was_empty) scheduleActivation(); } @@ -52,7 +54,7 @@ public: std::lock_guard lock(mutex); if (requests.empty()) return {nullptr, false}; - ResourceRequest * result = requests.front(); + ResourceRequest * result = &requests.front(); requests.pop_front(); if (requests.empty()) busy_periods++; @@ -65,19 +67,24 @@ public: bool cancelRequest(ResourceRequest * request) override { std::lock_guard lock(mutex); - // TODO(serxa): reimplement queue as intrusive list of ResourceRequest to make this O(1) instead of O(N) - for (auto i = requests.begin(), e = requests.end(); i != e; ++i) + if (request->is_linked()) { - if (*i == request) - { - requests.erase(i); - if (requests.empty()) - busy_periods++; - queue_cost -= request->cost; - canceled_requests++; - canceled_cost += request->cost; - return true; - } + // It's impossible to check that `request` is indeed inserted to this queue and not another queue. + // It's up to caller to make sure this is the case. Otherwise, list sizes will be corrupted. + // Not tracking list sizes is not an option, because another problem appears: removing from list w/o locking. 
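For readers unfamiliar with Boost.Intrusive, a minimal standalone sketch of the O(1) unlink this hunk switches to (`Request` and the `main` driver are illustrative stand-ins, not the real `ResourceRequest` or queue):

```cpp
#include <boost/intrusive/list.hpp>
#include <cassert>

// An intrusive list lets an element remove itself in O(1), because the hook
// stored inside the element knows its own position in the list.
struct Request : boost::intrusive::list_base_hook<>
{
    int cost = 0;
};

int main()
{
    boost::intrusive::list<Request> queue;
    Request a, b, c;
    queue.push_back(a);
    queue.push_back(b);
    queue.push_back(c);

    // Cancel `b` without scanning: iterator_to() recovers its position directly.
    if (b.is_linked())
        queue.erase(queue.iterator_to(b));
    assert(queue.size() == 2);

    queue.clear();  // unlink the remaining elements before their hooks are destroyed
}
```

Note the trade-off the hunk's comment describes: `is_linked()` only says the request sits in *some* list, which is why the caller must guarantee it is this queue's list.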
+ // Another possible solution - keep track if request `is_cancelable` guarded by `mutex` + // Simple check for list size corruption + if (requests.empty()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "trying to cancel request (linked into another queue) from empty queue: {}", getPath()); + + requests.erase(requests.iterator_to(*request)); + + if (requests.empty()) + busy_periods++; + queue_cost -= request->cost; + canceled_requests++; + canceled_cost += request->cost; + return true; } return false; } @@ -124,7 +131,7 @@ public: private: std::mutex mutex; Int64 queue_cost = 0; - std::deque requests; // TODO(serxa): reimplement it using intrusive list to avoid allocations/deallocations and O(N) during cancel + boost::intrusive::list requests; }; } diff --git a/src/Common/Scheduler/ResourceRequest.h b/src/Common/Scheduler/ResourceRequest.h index f3153ad382c..d64f624cec5 100644 --- a/src/Common/Scheduler/ResourceRequest.h +++ b/src/Common/Scheduler/ResourceRequest.h @@ -1,5 +1,6 @@ #pragma once +#include #include #include @@ -41,7 +42,7 @@ constexpr ResourceCost ResourceCostMax = std::numeric_limits::max(); * Returning true means successful cancel and therefore steps (4) and (5) are not going to happen * and step (6) MUST be omitted. */ -class ResourceRequest +class ResourceRequest : public boost::intrusive::list_base_hook<> { public: /// Cost of request execution; should be filled before request enqueueing. @@ -62,6 +63,7 @@ public: { cost = cost_; constraint = nullptr; + // Note that list_base_hook should be reset independently (by intrusive list) } virtual ~ResourceRequest() = default; From 7232bf45768f56c768ac03ed4b34c085bc6f060a Mon Sep 17 00:00:00 2001 From: zvonand Date: Tue, 2 Apr 2024 16:12:11 +0200 Subject: [PATCH 025/289] no reuse request --- src/Storages/StorageS3.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 09a5ffc86a5..28bfa3c32a9 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -252,6 +252,7 @@ private: return true; } + request = S3::ListObjectsV2Request{}; request.SetBucket(globbed_uri.bucket); request.SetPrefix(key_prefix); request.SetMaxKeys(static_cast(request_settings.list_object_keys_size)); From 25cab6f0713221e32b2c2fef844e2c2fde77e985 Mon Sep 17 00:00:00 2001 From: zvonand Date: Wed, 3 Apr 2024 20:57:10 +0200 Subject: [PATCH 026/289] fix schema inference cache (1) --- src/Storages/StorageS3.cpp | 19 +++++++++++-------- 1 file changed, 11 insertions(+), 8 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 28bfa3c32a9..b19e61762d1 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -217,7 +217,7 @@ public: bool no_globs_in_key = fillBufferForKey(*expanded_keys_iter); expanded_keys_iter++; if (expanded_keys_iter == expanded_keys.end() && no_globs_in_key) - is_finished = true; + is_finished_for_key = true; } KeyWithInfoPtr next(size_t) @@ -241,6 +241,7 @@ private: bool fillBufferForKey(const std::string & uri_key) { + is_finished_for_key = false; const String key_prefix = uri_key.substr(0, uri_key.find_first_of("*?{")); /// We don't have to list bucket, because there is no asterisks. 
@@ -249,10 +250,12 @@ private: buffer.clear(); buffer.emplace_back(std::make_shared(uri_key, std::nullopt)); buffer_iter = buffer.begin(); + if (read_keys) + read_keys->insert(read_keys->end(), buffer.begin(), buffer.end()); return true; } - request = S3::ListObjectsV2Request{}; + request = {}; request.SetBucket(globbed_uri.bucket); request.SetPrefix(key_prefix); request.SetMaxKeys(static_cast(request_settings.list_object_keys_size)); @@ -308,11 +311,11 @@ private: bool no_globs_in_key = fillBufferForKey(*expanded_keys_iter); expanded_keys_iter++; if (expanded_keys_iter == expanded_keys.end() && no_globs_in_key) - is_finished = true; + is_finished_for_key = true; continue; } - if (is_finished) + if (is_finished_for_key) return {}; try @@ -327,7 +330,7 @@ private: /// it may take some time for threads to stop processors and they /// may still use this iterator after exception is thrown. /// To avoid this UB, reset the buffer and return defaults for further calls. - is_finished = true; + is_finished_for_key = true; buffer.clear(); buffer_iter = buffer.begin(); throw; @@ -351,9 +354,9 @@ private: const auto & result_batch = outcome.GetResult().GetContents(); /// It returns false when all objects were returned - is_finished = !outcome.GetResult().GetIsTruncated(); + is_finished_for_key = !outcome.GetResult().GetIsTruncated(); - if (!is_finished) + if (!is_finished_for_key) { /// Even if task is finished the thread may be not freed in pool. /// So wait until it will be freed before scheduling a new task. @@ -444,7 +447,7 @@ private: ActionsDAGPtr filter_dag; std::unique_ptr matcher; bool recursive{false}; - bool is_finished{false}; + bool is_finished_for_key{false}; KeysWithInfo * read_keys; S3::ListObjectsV2Request request; From ce3969e25d7ef8bd661fa6047ac0882735fd567a Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Thu, 4 Apr 2024 19:47:34 +0000 Subject: [PATCH 027/289] adapt test to new behavior --- tests/integration/test_storage_s3/test.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/integration/test_storage_s3/test.py b/tests/integration/test_storage_s3/test.py index 6d5b84a8143..9d275575f8a 100644 --- a/tests/integration/test_storage_s3/test.py +++ b/tests/integration/test_storage_s3/test.py @@ -1768,13 +1768,13 @@ def test_schema_inference_cache(started_cluster): check_cache(instance, []) run_describe_query(instance, files, storage_name, started_cluster, bucket) - check_cache_misses(instance, files, storage_name, started_cluster, bucket, 4) + check_cache_misses(instance, files, storage_name, started_cluster, bucket, 4 if storage_name == "url" else 1) instance.query("system drop schema cache") check_cache(instance, []) run_describe_query(instance, files, storage_name, started_cluster, bucket) - check_cache_misses(instance, files, storage_name, started_cluster, bucket, 4) + check_cache_misses(instance, files, storage_name, started_cluster, bucket, 4 if storage_name == "url" else 1) instance.query("system drop schema cache") From e3858107969d6f6363de343197608bf65693dd59 Mon Sep 17 00:00:00 2001 From: zvonand Date: Thu, 4 Apr 2024 22:18:41 +0200 Subject: [PATCH 028/289] fix black --- tests/integration/test_storage_s3/test.py | 18 ++++++++++++++++-- 1 file changed, 16 insertions(+), 2 deletions(-) diff --git a/tests/integration/test_storage_s3/test.py b/tests/integration/test_storage_s3/test.py index 9d275575f8a..a4ed94c815b 100644 --- a/tests/integration/test_storage_s3/test.py +++ b/tests/integration/test_storage_s3/test.py @@ -1768,13 +1768,27 @@ def 
test_schema_inference_cache(started_cluster): check_cache(instance, []) run_describe_query(instance, files, storage_name, started_cluster, bucket) - check_cache_misses(instance, files, storage_name, started_cluster, bucket, 4 if storage_name == "url" else 1) + check_cache_misses( + instance, + files, + storage_name, + started_cluster, + bucket, + 4 if storage_name == "url" else 1, + ) instance.query("system drop schema cache") check_cache(instance, []) run_describe_query(instance, files, storage_name, started_cluster, bucket) - check_cache_misses(instance, files, storage_name, started_cluster, bucket, 4 if storage_name == "url" else 1) + check_cache_misses( + instance, + files, + storage_name, + started_cluster, + bucket, + 4 if storage_name == "url" else 1, + ) instance.query("system drop schema cache") From 307f69380efbd7af9a3e897df04cc9307558ad91 Mon Sep 17 00:00:00 2001 From: skyoct Date: Sun, 7 Apr 2024 09:02:43 +0000 Subject: [PATCH 029/289] support clamp function --- .../functions/conditional-functions.md | 31 +++++++++ src/Functions/clamp.cpp | 68 +++++++++++++++++++ .../queries/0_stateless/03036_clamp.reference | 4 ++ tests/queries/0_stateless/03036_clamp.sql | 4 ++ 4 files changed, 107 insertions(+) create mode 100644 src/Functions/clamp.cpp create mode 100644 tests/queries/0_stateless/03036_clamp.reference create mode 100644 tests/queries/0_stateless/03036_clamp.sql diff --git a/docs/en/sql-reference/functions/conditional-functions.md b/docs/en/sql-reference/functions/conditional-functions.md index eb4e98961f1..c89de4d9958 100644 --- a/docs/en/sql-reference/functions/conditional-functions.md +++ b/docs/en/sql-reference/functions/conditional-functions.md @@ -234,3 +234,34 @@ SELECT least(toDateTime32(now() + toIntervalDay(1)), toDateTime64(now(), 3)) :::note The type returned is a DateTime64 as the DataTime32 must be promoted to 64 bit for the comparison. ::: + +## clamp + +Constrain the return value between A and B. + +**Syntax** + +``` sql +if(x, min, max) +``` + +**Arguments** + +- `x` – Input value. +- `min` – Limit the lower bound. +- `max` – Limit the upper bound. + +**Returned values** + +If the value is less than the minimum value, return the minimum value; if it is greater than the maximum value, return the maximum value; otherwise, return the current value. 
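For comparison, the documented behaviour matches C++17's `std::clamp`; a standalone check of the same semantics (illustration only, not part of the patch — the three assertions mirror the expected results in the patch's own `03036_clamp.reference`):

```cpp
#include <algorithm>
#include <cassert>

int main()
{
    // Below the range -> min, above the range -> max, inside the range -> unchanged.
    assert(std::clamp(1, 10, 20) == 10);
    assert(std::clamp(30, 10, 20) == 20);
    assert(std::clamp(15, 10, 20) == 15);
}
```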
+
+Examples:
+
+```sql
+SELECT least(1, 2, 3) result, toTypeName(result) type;
+```
+```response
+┌─result─┬─type────┐
+│      2 │ Float64 │
+└────────┴─────────┘
+```
\ No newline at end of file
diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp
new file mode 100644
index 00000000000..38be5a28f28
--- /dev/null
+++ b/src/Functions/clamp.cpp
@@ -0,0 +1,68 @@
+#include
+#include
+#include
+#include
+#include
+#include
+
+namespace DB
+{
+
+namespace ErrorCodes
+{
+    extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
+}
+
+
+class FunctionClamp : public IFunction
+{
+
+public:
+    static constexpr auto name = "clamp";
+
+    String getName() const override { return name; }
+    size_t getNumberOfArguments() const override { return 0; }
+    bool isVariadic() const override { return true; }
+    bool useDefaultImplementationForConstants() const override { return true; }
+    bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return false; }
+    static FunctionPtr create(ContextPtr) { return std::make_shared(); }
+
+    DataTypePtr getReturnTypeImpl(const DataTypes & types) const override
+    {
+        if (types.size() != 3)
+            throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} must be 3 arguments", getName());
+
+        return getLeastSupertype(types);
+    }
+
+    ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const override
+    {
+
+        size_t arg_size = arguments.size();
+        Columns converted_columns(arg_size);
+        for (size_t arg = 0; arg < arg_size; ++arg)
+            converted_columns[arg] = castColumn(arguments[arg], result_type)->convertToFullColumnIfConst();
+
+        auto result_column = result_type->createColumn();
+        for (size_t row_num = 0; row_num < input_rows_count; ++row_num)
+        {
+            size_t best_arg = 0;
+
+            if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) > 0)
+                best_arg = 1;
+            else if (converted_columns[2]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) < 0)
+                best_arg = 2;
+
+            result_column->insertFrom(*converted_columns[best_arg], row_num);
+        }
+
+        return result_column;
+    }
+
+};
+
+REGISTER_FUNCTION(Clamp)
+{
+    factory.registerFunction();
+}
+}
diff --git a/tests/queries/0_stateless/03036_clamp.reference b/tests/queries/0_stateless/03036_clamp.reference
new file mode 100644
index 00000000000..bd0d34dabea
--- /dev/null
+++ b/tests/queries/0_stateless/03036_clamp.reference
@@ -0,0 +1,4 @@
+10
+20
+15
+b
diff --git a/tests/queries/0_stateless/03036_clamp.sql b/tests/queries/0_stateless/03036_clamp.sql
new file mode 100644
index 00000000000..8250325661a
--- /dev/null
+++ b/tests/queries/0_stateless/03036_clamp.sql
@@ -0,0 +1,4 @@
+SELECT clamp(1, 10, 20);
+SELECT clamp(30, 10, 20);
+SELECT clamp(15, 10, 20);
+SELECT clamp('a', 'b', 'c');
\ No newline at end of file

From 8faa1487549e1dae0ca27d0550d7c90dd3102668 Mon Sep 17 00:00:00 2001
From: skyoct
Date: Mon, 8 Apr 2024 06:44:11 +0000
Subject: [PATCH 030/289] better

---
 docs/en/sql-reference/functions/conditional-functions.md | 4 ++--
 src/Functions/clamp.cpp                                  | 1 -
 tests/queries/0_stateless/03036_clamp.reference          | 4 ++++
 tests/queries/0_stateless/03036_clamp.sql                | 6 +++++-
 4 files changed, 11 insertions(+), 4 deletions(-)

diff --git a/docs/en/sql-reference/functions/conditional-functions.md b/docs/en/sql-reference/functions/conditional-functions.md
index c89de4d9958..f19386af9f1 100644
--- a/docs/en/sql-reference/functions/conditional-functions.md
+++ b/docs/en/sql-reference/functions/conditional-functions.md
@@ -242,7 +242,7 @@ Constrain the return value between A and B.
 **Syntax**
 
 ``` sql
-if(x, min, max)
+clamp(x, min, max)
 ```
 
 **Arguments**
 
@@ -258,7 +258,7 @@ If the value is less than the minimum value, return the minimum value; if it is
 
 Examples:
 
 ```sql
-SELECT least(1, 2, 3) result, toTypeName(result) type;
+SELECT clamp(1, 2, 3) result, toTypeName(result) type;
 ```
 ```response
 ┌─result─┬─type────┐
diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp
index 38be5a28f28..0210d135235 100644
--- a/src/Functions/clamp.cpp
+++ b/src/Functions/clamp.cpp
@@ -37,7 +37,6 @@ public:
 
     ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const override
     {
-
         size_t arg_size = arguments.size();
         Columns converted_columns(arg_size);
         for (size_t arg = 0; arg < arg_size; ++arg)
             converted_columns[arg] = castColumn(arguments[arg], result_type)->convertToFullColumnIfConst();
diff --git a/tests/queries/0_stateless/03036_clamp.reference b/tests/queries/0_stateless/03036_clamp.reference
index bd0d34dabea..bea85d8ccdd 100644
--- a/tests/queries/0_stateless/03036_clamp.reference
+++ b/tests/queries/0_stateless/03036_clamp.reference
@@ -2,3 +2,7 @@
 20
 15
 b
+0
+['hello']
+-1
+234
diff --git a/tests/queries/0_stateless/03036_clamp.sql b/tests/queries/0_stateless/03036_clamp.sql
index 8250325661a..8d4f2112830 100644
--- a/tests/queries/0_stateless/03036_clamp.sql
+++ b/tests/queries/0_stateless/03036_clamp.sql
@@ -1,4 +1,8 @@
 SELECT clamp(1, 10, 20);
 SELECT clamp(30, 10, 20);
 SELECT clamp(15, 10, 20);
-SELECT clamp('a', 'b', 'c');
\ No newline at end of file
+SELECT clamp('a', 'b', 'c');
+SELECT clamp(today(), yesterday() - 10, yesterday() + 10) - today()
+SELECT clamp([], ['hello'], ['world']);
+SELECT clamp(-1., -1000., 18446744073709551615.);
+SELECT clamp(toNullable(123), 234, 456);

From a6d088bed8ff87c1901077b7c8960034445aa9d4 Mon Sep 17 00:00:00 2001
From: skyoct
Date: Mon, 8 Apr 2024 10:35:53 +0000
Subject: [PATCH 031/289] better

---
 src/Functions/clamp.cpp | 19 +++++++++++--------
 1 file changed, 11 insertions(+), 8 deletions(-)

diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp
index 0210d135235..dc0ddffbd82 100644
--- a/src/Functions/clamp.cpp
+++ b/src/Functions/clamp.cpp
@@ -11,6 +11,7 @@ namespace DB
 namespace ErrorCodes
 {
     extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
+    extern const int BAD_ARGUMENTS;
 }
 
 
@@ -30,7 +31,7 @@ public:
     DataTypePtr getReturnTypeImpl(const DataTypes & types) const override
     {
         if (types.size() != 3)
-            throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} must be 3 arguments", getName());
+            throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} requires 3 arguments", getName());
 
         return getLeastSupertype(types);
     }
@@ -41,18 +42,20 @@ public:
         Columns converted_columns(arg_size);
         for (size_t arg = 0; arg < arg_size; ++arg)
             converted_columns[arg] = castColumn(arguments[arg], result_type)->convertToFullColumnIfConst();
+        if (converted_columns[1]->compareAt(0, 0, *converted_columns[2], 1) > 0)
+            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Function {} the minimum value cannot be greater than the maximum value", getName());
 
         auto result_column = result_type->createColumn();
         for (size_t row_num = 0; row_num < input_rows_count; ++row_num)
         {
             size_t best_arg = 0;
+            if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) > 0)
+                best_arg = 1;
+            else if (converted_columns[2]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) < 0)
+                best_arg = 2;
 
-            result_column->insertFrom(*converted_columns[best_arg], row_num);
+            result_column->insertFrom(*converted_columns[best_arg], row_num);
         }
 
         return result_column;

From 0d6426d781538b899acfcfbff736f16422097466 Mon Sep 17 00:00:00 2001
From: skyoct
Date: Mon, 8 Apr 2024 13:34:54 +0000
Subject: [PATCH 032/289] better

---
 tests/queries/0_stateless/03036_clamp.reference | 2 ++
 tests/queries/0_stateless/03036_clamp.sql       | 2 ++
 2 files changed, 4 insertions(+)

diff --git a/tests/queries/0_stateless/03036_clamp.reference b/tests/queries/0_stateless/03036_clamp.reference
index bea85d8ccdd..5c8de57794d 100644
--- a/tests/queries/0_stateless/03036_clamp.reference
+++ b/tests/queries/0_stateless/03036_clamp.reference
@@ -6,3 +6,5 @@ b
 ['hello']
 -1
 234
+null
+null
\ No newline at end of file
diff --git a/tests/queries/0_stateless/03036_clamp.sql b/tests/queries/0_stateless/03036_clamp.sql
index 8d4f2112830..e075096f8ef 100644
--- a/tests/queries/0_stateless/03036_clamp.sql
+++ b/tests/queries/0_stateless/03036_clamp.sql
@@ -6,3 +6,5 @@ SELECT clamp(today(), yesterday() - 10, yesterday() + 10) - today()
 SELECT clamp([], ['hello'], ['world']);
 SELECT clamp(-1., -1000., 18446744073709551615.);
 SELECT clamp(toNullable(123), 234, 456);
+select clamp(1, null, 5);
+select clamp(1, 6, null);
\ No newline at end of file

From 5d36d1aa4efad0843d4a9389003c8389f7b2e48a Mon Sep 17 00:00:00 2001
From: skyoct
Date: Mon, 8 Apr 2024 13:53:33 +0000
Subject: [PATCH 033/289] style

---
 src/Functions/clamp.cpp | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp
index dc0ddffbd82..0593c6c6b16 100644
--- a/src/Functions/clamp.cpp
+++ b/src/Functions/clamp.cpp
@@ -49,7 +49,6 @@ public:
         for (size_t row_num = 0; row_num < input_rows_count; ++row_num)
         {
             size_t best_arg = 0;
-
             if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) > 0)
                 best_arg = 1;
             else if (converted_columns[2]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) < 0)

From 88548eb19eb07ea29c8d603d77a43039844a351c Mon Sep 17 00:00:00 2001
From: avogar
Date: Mon, 8 Apr 2024 18:59:04 +0000
Subject: [PATCH 034/289] Fix exception message during writing to partitioned
 s3 path with globs

---
 src/Storages/StorageS3.cpp                    | 22 +++++++++++++------
 src/Storages/StorageS3.h                      |  6 +++--
 ...rite_to_globbed_partitioned_path.reference |  0
 ...7_s3_write_to_globbed_partitioned_path.sql |  2 ++
 4 files changed, 21 insertions(+), 9 deletions(-)
 create mode 100644 tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.reference
 create mode 100644 tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql

diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp
index 6cda0fca60b..c0802d02120 100644
--- a/src/Storages/StorageS3.cpp
+++ b/src/Storages/StorageS3.cpp
@@ -207,7 +207,7 @@ public:
         , list_objects_scheduler(threadPoolCallbackRunner(list_objects_pool, "ListObjects"))
         , file_progress_callback(file_progress_callback_)
     {
-        if (globbed_uri.bucket.find_first_of("*?{") != std::string::npos)
+        if (globbed_uri.bucket.find_first_of("*?{") != globbed_uri.bucket.npos)
             throw Exception(ErrorCodes::UNEXPECTED_EXPRESSION, "Expression can not have wildcards inside bucket name");
 
         const String key_prefix = globbed_uri.key.substr(0,
globbed_uri.key.find_first_of("*?{")); @@ -1194,7 +1194,7 @@ void ReadFromStorageS3Step::createIterator(const ActionsDAG::Node * predicate) void ReadFromStorageS3Step::initializePipeline(QueryPipelineBuilder & pipeline, const BuildQueryPipelineSettings &) { - if (storage.partition_by && query_configuration.withWildcard()) + if (storage.partition_by && query_configuration.withPartitionWildcard()) throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Reading from a partitioned S3 storage is not implemented yet"); createIterator(nullptr); @@ -1249,12 +1249,16 @@ SinkToStoragePtr StorageS3::write(const ASTPtr & query, const StorageMetadataPtr { auto query_configuration = updateConfigurationAndGetCopy(local_context); + if (query_configuration.withGlobsIgnorePartitionWildcard()) + throw Exception(ErrorCodes::DATABASE_ACCESS_DENIED, + "S3 key '{}' contains globs, so the table is in readonly mode", query_configuration.url.key); + auto sample_block = metadata_snapshot->getSampleBlock(); auto chosen_compression_method = chooseCompressionMethod(query_configuration.keys.back(), query_configuration.compression_method); auto insert_query = std::dynamic_pointer_cast(query); auto partition_by_ast = insert_query ? (insert_query->partition_by ? insert_query->partition_by : partition_by) : nullptr; - bool is_partitioned_implementation = partition_by_ast && query_configuration.withWildcard(); + bool is_partitioned_implementation = partition_by_ast && query_configuration.withPartitionWildcard(); if (is_partitioned_implementation) { @@ -1271,10 +1275,6 @@ SinkToStoragePtr StorageS3::write(const ASTPtr & query, const StorageMetadataPtr } else { - if (query_configuration.withGlobs()) - throw Exception(ErrorCodes::DATABASE_ACCESS_DENIED, - "S3 key '{}' contains globs, so the table is in readonly mode", query_configuration.url.key); - bool truncate_in_insert = local_context->getSettingsRef().s3_truncate_on_insert; if (!truncate_in_insert && S3::objectExists(*query_configuration.client, query_configuration.url.bucket, query_configuration.keys.back(), query_configuration.url.version_id, query_configuration.request_settings)) @@ -1460,6 +1460,14 @@ void StorageS3::Configuration::connect(const ContextPtr & context) credentials.GetSessionToken()); } +bool StorageS3::Configuration::withGlobsIgnorePartitionWildcard() const +{ + if (!withPartitionWildcard()) + return withGlobs(); + + return PartitionedSink::replaceWildcards(getPath(), "").find_first_of("*?{") != std::string::npos; +} + void StorageS3::processNamedCollectionResult(StorageS3::Configuration & configuration, const NamedCollection & collection) { validateNamedCollection(collection, required_configuration_keys, optional_configuration_keys); diff --git a/src/Storages/StorageS3.h b/src/Storages/StorageS3.h index 19cbfaa6f08..e657db7bd35 100644 --- a/src/Storages/StorageS3.h +++ b/src/Storages/StorageS3.h @@ -274,7 +274,7 @@ public: { Configuration() = default; - String getPath() const { return url.key; } + const String & getPath() const { return url.key; } bool update(const ContextPtr & context); @@ -282,13 +282,15 @@ public: bool withGlobs() const { return url.key.find_first_of("*?{") != std::string::npos; } - bool withWildcard() const + bool withPartitionWildcard() const { static const String PARTITION_ID_WILDCARD = "{_partition_id}"; return url.bucket.find(PARTITION_ID_WILDCARD) != String::npos || keys.back().find(PARTITION_ID_WILDCARD) != String::npos; } + bool withGlobsIgnorePartitionWildcard() const; + S3::URI url; S3::AuthSettings auth_settings; 
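As an aside before the header's remaining members: the key predicate patch 034 introduces is `withGlobsIgnorePartitionWildcard` — strip the `{_partition_id}` wildcard first, then look for glob characters. A standalone sketch of the same check, with a simplified stand-in for `PartitionedSink::replaceWildcards` (only the `find_first_of("*?{")` test mirrors the patch verbatim):

```cpp
#include <cassert>
#include <string>

// Simplified stand-in: substitute every occurrence of the partition wildcard.
std::string replaceWildcards(std::string path, const std::string & partition_id)
{
    static const std::string wildcard = "{_partition_id}";
    for (size_t pos; (pos = path.find(wildcard)) != std::string::npos;)
        path.replace(pos, wildcard.size(), partition_id);
    return path;
}

// Globs remain "real" only if they survive removal of the partition wildcard.
bool withGlobsIgnorePartitionWildcard(const std::string & path)
{
    return replaceWildcards(path, "").find_first_of("*?{") != std::string::npos;
}

int main()
{
    assert(!withGlobsIgnorePartitionWildcard("data_{_partition_id}.csv"));   // writable
    assert(withGlobsIgnorePartitionWildcard("data_*_{_partition_id}.csv"));  // readonly
}
```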
S3Settings::RequestSettings request_settings; diff --git a/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.reference b/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql b/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql new file mode 100644 index 00000000000..400bc790f0b --- /dev/null +++ b/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql @@ -0,0 +1,2 @@ +insert into function s3('http://localhost:11111/test/data_*_{_partition_id}.csv') partition by number % 3 select * from numbers(10); -- {serverError DATABASE_ACCESS_DENIED} + From 21ab0e4ea27b389ab697cb5f045a9600bd0fa7c2 Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 8 Apr 2024 19:01:00 +0000 Subject: [PATCH 035/289] Remove bad change --- src/Storages/StorageS3.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index c0802d02120..8de139ce366 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -207,7 +207,7 @@ public: , list_objects_scheduler(threadPoolCallbackRunner(list_objects_pool, "ListObjects")) , file_progress_callback(file_progress_callback_) { - if (globbed_uri.bucket.find_first_of("*?{") != globbed_uri.bucket.npos) + if (globbed_uri.bucket.find_first_of("*?{") != std::string::npos) throw Exception(ErrorCodes::UNEXPECTED_EXPRESSION, "Expression can not have wildcards inside bucket name"); const String key_prefix = globbed_uri.key.substr(0, globbed_uri.key.find_first_of("*?{")); From 78dd23fd83e541c73b2fec0bc6bdf19d8d5b9297 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 8 Apr 2024 21:23:51 +0200 Subject: [PATCH 036/289] Don't run new test in fasttest --- .../0_stateless/03037_s3_write_to_globbed_partitioned_path.sql | 2 ++ 1 file changed, 2 insertions(+) diff --git a/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql b/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql index 400bc790f0b..1de89a593b0 100644 --- a/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql +++ b/tests/queries/0_stateless/03037_s3_write_to_globbed_partitioned_path.sql @@ -1,2 +1,4 @@ +-- Tags: no-fasttest + insert into function s3('http://localhost:11111/test/data_*_{_partition_id}.csv') partition by number % 3 select * from numbers(10); -- {serverError DATABASE_ACCESS_DENIED} From 8accf395fb9cb3f2b896151ab09a902c674b9809 Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 8 Apr 2024 20:37:06 +0000 Subject: [PATCH 037/289] Fix for HDFS and Azure --- src/Storages/HDFS/StorageHDFS.cpp | 4 ++++ src/Storages/StorageAzureBlob.cpp | 19 +++++++++++++------ src/Storages/StorageAzureBlob.h | 4 +++- .../test_storage_azure_blob_storage/test.py | 14 ++++++++++++++ tests/integration/test_storage_hdfs/test.py | 10 ++++++++++ 5 files changed, 44 insertions(+), 7 deletions(-) diff --git a/src/Storages/HDFS/StorageHDFS.cpp b/src/Storages/HDFS/StorageHDFS.cpp index 93cf64f30a0..fe5d590770e 100644 --- a/src/Storages/HDFS/StorageHDFS.cpp +++ b/src/Storages/HDFS/StorageHDFS.cpp @@ -1065,6 +1065,10 @@ SinkToStoragePtr StorageHDFS::write(const ASTPtr & query, const StorageMetadataP if (is_partitioned_implementation) { + String path = current_uri.substr(current_uri.find('/', current_uri.find("//") + 2)); + if 
(PartitionedSink::replaceWildcards(path, "").find_first_of("*?{") != std::string::npos) + throw Exception(ErrorCodes::DATABASE_ACCESS_DENIED, "URI '{}' contains globs, so the table is in readonly mode", uris.back()); + return std::make_shared( partition_by_ast, current_uri, diff --git a/src/Storages/StorageAzureBlob.cpp b/src/Storages/StorageAzureBlob.cpp index 306a5eac8e5..1eb18021653 100644 --- a/src/Storages/StorageAzureBlob.cpp +++ b/src/Storages/StorageAzureBlob.cpp @@ -462,6 +462,13 @@ Poco::URI StorageAzureBlob::Configuration::getConnectionURL() const return Poco::URI(parsed_connection_string.BlobServiceUrl.GetAbsoluteUrl()); } +bool StorageAzureBlob::Configuration::withGlobsIgnorePartitionWildcard() const +{ + if (!withPartitionWildcard()) + return withGlobs(); + + return PartitionedSink::replaceWildcards(getPath(), "").find_first_of("*?{") != std::string::npos; +} StorageAzureBlob::StorageAzureBlob( const Configuration & configuration_, @@ -749,7 +756,7 @@ void StorageAzureBlob::read( size_t max_block_size, size_t num_streams) { - if (partition_by && configuration.withWildcard()) + if (partition_by && configuration.withPartitionWildcard()) throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Reading from a partitioned Azure storage is not implemented yet"); auto this_ptr = std::static_pointer_cast(shared_from_this()); @@ -836,12 +843,16 @@ void ReadFromAzureBlob::initializePipeline(QueryPipelineBuilder & pipeline, cons SinkToStoragePtr StorageAzureBlob::write(const ASTPtr & query, const StorageMetadataPtr & metadata_snapshot, ContextPtr local_context, bool /*async_insert*/) { + if (configuration.withGlobsIgnorePartitionWildcard()) + throw Exception(ErrorCodes::DATABASE_ACCESS_DENIED, + "AzureBlobStorage key '{}' contains globs, so the table is in readonly mode", configuration.blob_path); + auto sample_block = metadata_snapshot->getSampleBlock(); auto chosen_compression_method = chooseCompressionMethod(configuration.blobs_paths.back(), configuration.compression_method); auto insert_query = std::dynamic_pointer_cast(query); auto partition_by_ast = insert_query ? (insert_query->partition_by ? 
insert_query->partition_by : partition_by) : nullptr; - bool is_partitioned_implementation = partition_by_ast && configuration.withWildcard(); + bool is_partitioned_implementation = partition_by_ast && configuration.withPartitionWildcard(); if (is_partitioned_implementation) { @@ -857,10 +868,6 @@ SinkToStoragePtr StorageAzureBlob::write(const ASTPtr & query, const StorageMeta } else { - if (configuration.withGlobs()) - throw Exception(ErrorCodes::DATABASE_ACCESS_DENIED, - "AzureBlobStorage key '{}' contains globs, so the table is in readonly mode", configuration.blob_path); - bool truncate_in_insert = local_context->getSettingsRef().azure_truncate_on_insert; if (!truncate_in_insert && object_storage->exists(StoredObject(configuration.blob_path))) diff --git a/src/Storages/StorageAzureBlob.h b/src/Storages/StorageAzureBlob.h index 3f1ba33f636..928a8204bb2 100644 --- a/src/Storages/StorageAzureBlob.h +++ b/src/Storages/StorageAzureBlob.h @@ -37,12 +37,14 @@ public: bool withGlobs() const { return blob_path.find_first_of("*?{") != std::string::npos; } - bool withWildcard() const + bool withPartitionWildcard() const { static const String PARTITION_ID_WILDCARD = "{_partition_id}"; return blobs_paths.back().find(PARTITION_ID_WILDCARD) != String::npos; } + bool withGlobsIgnorePartitionWildcard() const; + Poco::URI getConnectionURL() const; std::string connection_url; diff --git a/tests/integration/test_storage_azure_blob_storage/test.py b/tests/integration/test_storage_azure_blob_storage/test.py index 7d30265e4f8..1c87feee297 100644 --- a/tests/integration/test_storage_azure_blob_storage/test.py +++ b/tests/integration/test_storage_azure_blob_storage/test.py @@ -1323,6 +1323,20 @@ def test_format_detection(cluster): assert result == expected_result +def test_write_to_globbed_partitioned_path(cluster): + node = cluster.instances["node"] + storage_account_url = cluster.env_variables["AZURITE_STORAGE_ACCOUNT_URL"] + account_name = "devstoreaccount1" + account_key = "Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==" + error = azure_query( + node, + f"INSERT INTO TABLE FUNCTION azureBlobStorage('{storage_account_url}', 'cont', 'test_data_*_{{_partition_id}}', '{account_name}', '{account_key}', 'CSV', 'auto', 'x UInt64') partition by 42 select 42", + expect_error="true", + ) + + assert "DATABASE_ACCESS_DENIED" in error + + def test_parallel_read(cluster): node = cluster.instances["node"] connection_string = cluster.env_variables["AZURITE_CONNECTION_STRING"] diff --git a/tests/integration/test_storage_hdfs/test.py b/tests/integration/test_storage_hdfs/test.py index 9dec1954406..5daf8618036 100644 --- a/tests/integration/test_storage_hdfs/test.py +++ b/tests/integration/test_storage_hdfs/test.py @@ -1116,6 +1116,16 @@ def test_format_detection(started_cluster): assert expected_result == result +def test_write_to_globbed_partitioned_path(started_cluster): + node = started_cluster.instances["node1"] + + error = node.query_and_get_error( + "insert into function hdfs('hdfs://hdfs1:9000/test_data_*_{_partition_id}.csv') partition by 42 select 42" + ) + + assert "DATABASE_ACCESS_DENIED" in error + + if __name__ == "__main__": cluster.start() input("Cluster created, press any key to destroy...") From 08f700118f266234ad3eba15ea95f91a85d81db8 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Tue, 9 Apr 2024 13:24:37 +0800 Subject: [PATCH 038/289] [doc] update npy format data types --- docs/en/interfaces/formats.md | 33 ++++++++++++++++----------------- 1 file 
changed, 16 insertions(+), 17 deletions(-) diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index 03cf345349e..cc3ea467ab1 100644 --- a/docs/en/interfaces/formats.md +++ b/docs/en/interfaces/formats.md @@ -2465,23 +2465,22 @@ Result: ## Npy {#data-format-npy} -This function is designed to load a NumPy array from a .npy file into ClickHouse. The NumPy file format is a binary format used for efficiently storing arrays of numerical data. During import, ClickHouse treats top level dimension as an array of rows with single column. Supported Npy data types and their corresponding type in ClickHouse: -| Npy type | ClickHouse type | -|:--------:|:---------------:| -| b1 | UInt8 | -| i1 | Int8 | -| i2 | Int16 | -| i4 | Int32 | -| i8 | Int64 | -| u1 | UInt8 | -| u2 | UInt16 | -| u4 | UInt32 | -| u8 | UInt64 | -| f2 | Float32 | -| f4 | Float32 | -| f8 | Float64 | -| S | String | -| U | String | +This function is designed to load a NumPy array from a .npy file into ClickHouse. The NumPy file format is a binary format used for efficiently storing arrays of numerical data. During import, ClickHouse treats top level dimension as an array of rows with single column. Supported Npy data types and their corresponding type in ClickHouse: + +| Npy data type (`INSERT`) | ClickHouse data type | Npy data type (`SELECT`) | +|--------------------------|-----------------------------------------------------------------|--------------------------| +| `i1` | [Int8](/docs/en/sql-reference/data-types/int-uint.md) | `i1` | +| `i2` | [Int16](/docs/en/sql-reference/data-types/int-uint.md) | `i2` | +| `i4` | [Int32](/docs/en/sql-reference/data-types/int-uint.md) | `i4` | +| `i8` | [Int64](/docs/en/sql-reference/data-types/int-uint.md) | `i8` | +| `u1`, `b1` | [UInt8](/docs/en/sql-reference/data-types/int-uint.md) | `u1` | +| `u2` | [UInt16](/docs/en/sql-reference/data-types/int-uint.md) | `u2` | +| `u4` | [UInt32](/docs/en/sql-reference/data-types/int-uint.md) | `u4` | +| `u8` | [UInt64](/docs/en/sql-reference/data-types/int-uint.md) | `u8` | +| `f2`, `f4` | [Float32](/docs/en/sql-reference/data-types/float.md) | `f4` | +| `f8` | [Float64](/docs/en/sql-reference/data-types/float.md) | `f8` | +| `S`, `U` | [String](/docs/en/sql-reference/data-types/string.md) | `S` | +| | [FixedString](/docs/en/sql-reference/data-types/fixedstring.md) | `S` | **Example of saving an array in .npy format using Python** From c0174fa17efc766bb49db0be67b6b5f7383429fc Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Tue, 9 Apr 2024 14:30:14 +0800 Subject: [PATCH 039/289] [feature] add npy output format --- docs/en/interfaces/formats.md | 8 + src/Formats/registerFormats.cpp | 6 +- .../Formats/Impl/NpyOutputFormat.cpp | 223 ++++++++++++++++++ src/Processors/Formats/Impl/NpyOutputFormat.h | 66 ++++++ .../02895_npy_output_format.reference | 60 +++++ .../0_stateless/02895_npy_output_format.sh | 110 +++++++++ 6 files changed, 471 insertions(+), 2 deletions(-) create mode 100644 src/Processors/Formats/Impl/NpyOutputFormat.cpp create mode 100644 src/Processors/Formats/Impl/NpyOutputFormat.h create mode 100644 tests/queries/0_stateless/02895_npy_output_format.reference create mode 100755 tests/queries/0_stateless/02895_npy_output_format.sh diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index cc3ea467ab1..f4b082c57ab 100644 --- a/docs/en/interfaces/formats.md +++ b/docs/en/interfaces/formats.md @@ -2507,6 +2507,14 @@ Result: └───────────────┘ ``` +**Selecting Data** + +You can select data 
from a ClickHouse table and save it into a file in the Npy format with the following command:
+
+```bash
+$ clickhouse-client --query="SELECT {column} FROM {some_table} FORMAT Npy" > {filename.npy}
+```
+
 ## LineAsString {#lineasstring}
 
 In this format, every line of input data is interpreted as a single string value. This format can only be parsed for table with a single field of type [String](/docs/en/sql-reference/data-types/string.md). The remaining columns must be set to [DEFAULT](/docs/en/sql-reference/statements/create/table.md/#default) or [MATERIALIZED](/docs/en/sql-reference/statements/create/table.md/#materialized), or omitted.

diff --git a/src/Formats/registerFormats.cpp b/src/Formats/registerFormats.cpp
index cc9cf380693..2070956883c 100644
--- a/src/Formats/registerFormats.cpp
+++ b/src/Formats/registerFormats.cpp
@@ -76,6 +76,8 @@ void registerInputFormatCustomSeparated(FormatFactory & factory);
 void registerOutputFormatCustomSeparated(FormatFactory & factory);
 void registerInputFormatCapnProto(FormatFactory & factory);
 void registerOutputFormatCapnProto(FormatFactory & factory);
+void registerInputFormatNpy(FormatFactory & factory);
+void registerOutputFormatNpy(FormatFactory & factory);
 
 /// Output only (presentational) formats.
 
@@ -103,7 +105,6 @@ void registerInputFormatMySQLDump(FormatFactory & factory);
 void registerInputFormatParquetMetadata(FormatFactory & factory);
 void registerInputFormatDWARF(FormatFactory & factory);
 void registerInputFormatOne(FormatFactory & factory);
-void registerInputFormatNpy(FormatFactory & factory);
 
 #if USE_HIVE
 void registerInputFormatHiveText(FormatFactory & factory);
@@ -221,6 +222,8 @@ void registerFormats()
     registerOutputFormatAvro(factory);
     registerInputFormatArrow(factory);
     registerOutputFormatArrow(factory);
+    registerInputFormatNpy(factory);
+    registerOutputFormatNpy(factory);
 
     registerOutputFormatPretty(factory);
     registerOutputFormatPrettyCompact(factory);
@@ -251,7 +254,6 @@ void registerFormats()
     registerInputFormatParquetMetadata(factory);
     registerInputFormatDWARF(factory);
     registerInputFormatOne(factory);
-    registerInputFormatNpy(factory);
 
     registerNonTrivialPrefixAndSuffixCheckerJSONEachRow(factory);
     registerNonTrivialPrefixAndSuffixCheckerJSONAsString(factory);

diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
new file mode 100644
index 00000000000..4a4af67b07e
--- /dev/null
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
@@ -0,0 +1,223 @@
+#include
+
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+
+#include
+
+
+namespace DB
+{
+
+namespace ErrorCodes
+{
+    extern const int TOO_MANY_COLUMNS;
+    extern const int BAD_ARGUMENTS;
+    extern const int ILLEGAL_COLUMN;
+}
+
+namespace
+{
+
+template <typename ColumnType, typename ValueType>
+void writeNumpyNumbers(const ColumnPtr & column, WriteBuffer & buf)
+{
+    const auto * number_column = assert_cast<const ColumnType *>(column.get());
+    for (size_t i = 0; i < number_column->size(); ++i)
+        writeBinaryLittleEndian(ValueType(number_column->getElement(i)), buf);
+}
+
+template <typename ColumnType>
+void writeNumpyStrings(const ColumnPtr & column, size_t length, WriteBuffer & buf)
+{
+    const auto * string_column = assert_cast<const ColumnType *>(column.get());
+    for (size_t i = 0; i < string_column->size(); ++i)
+        buf.write(string_column->getDataAt(i).data, length);
+}
+
+}
+
+String NpyOutputFormat::NumpyDataType::str()
+{
+    std::ostringstream dtype;
+    dtype << endianness << type << std::to_string(size);
+    return dtype.str();
+}
+
+NpyOutputFormat::NpyOutputFormat(WriteBuffer
& out_, const Block & header_) : IOutputFormat(header_, out_)
+{
+    const auto & header = getPort(PortKind::Main).getHeader();
+    auto data_types = header.getDataTypes();
+    if (data_types.size() > 1)
+        throw Exception(ErrorCodes::TOO_MANY_COLUMNS, "Expected single column for Npy output format, got {}", data_types.size());
+    data_type = data_types[0];
+}
+
+void NpyOutputFormat::initialize(const ColumnPtr & column)
+{
+    auto type = data_type;
+    ColumnPtr nested_column = column;
+    while (type->getTypeId() == TypeIndex::Array)
+    {
+        const auto * array_column = assert_cast<const ColumnArray *>(nested_column.get());
+        numpy_shape.push_back(array_column->getOffsets()[0]);
+        type = assert_cast<const DataTypeArray *>(type.get())->getNestedType();
+        nested_column = array_column->getDataPtr();
+    }
+
+    switch (type->getTypeId())
+    {
+        case TypeIndex::Int8: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int8)); break;
+        case TypeIndex::Int16: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int16)); break;
+        case TypeIndex::Int32: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int32)); break;
+        case TypeIndex::Int64: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int64)); break;
+        case TypeIndex::UInt8: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt8)); break;
+        case TypeIndex::UInt16: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt16)); break;
+        case TypeIndex::UInt32: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt32)); break;
+        case TypeIndex::UInt64: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt64)); break;
+        case TypeIndex::Float32: numpy_data_type = NumpyDataType('<', 'f', sizeof(Float32)); break;
+        case TypeIndex::Float64: numpy_data_type = NumpyDataType('<', 'f', sizeof(Float64)); break;
+        case TypeIndex::FixedString: numpy_data_type = NumpyDataType('|', 'S', assert_cast<const DataTypeFixedString *>(type.get())->getN()); break;
+        case TypeIndex::String: numpy_data_type = NumpyDataType('|', 'S', 0); break;
+        default:
+            has_exception = true;
+            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Type {} is not supported for Npy output format", type->getName());
+    }
+    nested_data_type = type;
+}
+
+void NpyOutputFormat::consume(Chunk chunk)
+{
+    if (!has_exception)
+    {
+        num_rows += chunk.getNumRows();
+        auto column = chunk.getColumns()[0];
+
+        if (!is_initialized)
+        {
+            initialize(column);
+            is_initialized = true;
+        }
+
+        /// check shape
+        auto type = data_type;
+        ColumnPtr nested_column = column;
+        int dim = 0;
+        while (type->getTypeId() == TypeIndex::Array)
+        {
+            const auto * array_column = assert_cast<const ColumnArray *>(nested_column.get());
+            const auto & array_offset = array_column->getOffsets();
+            for (size_t i = 1; i < array_offset.size(); ++i)
+            {
+                if (array_offset[i] - array_offset[i - 1] != numpy_shape[dim])
+                {
+                    has_exception = true;
+                    throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ClickHouse doesn't support object types, cannot format ragged nested sequences (which is a list of arrays with different shapes)");
+                }
+            }
+            type = assert_cast<const DataTypeArray *>(type.get())->getNestedType();
+            nested_column = array_column->getDataPtr();
+            dim++;
+        }
+
+        /// for type String, get maximum string length
+        if (type->getTypeId() == TypeIndex::String)
+        {
+            const auto & string_offsets = assert_cast<const ColumnString *>(nested_column.get())->getOffsets();
+            for (size_t i = 0; i < string_offsets.size(); ++i)
+            {
+                size_t string_length = static_cast<size_t>(string_offsets[i] - 1 - string_offsets[i - 1]);
+                numpy_data_type.size = numpy_data_type.size > string_length ?
numpy_data_type.size : string_length;
+            }
+        }
+
+        columns.push_back(nested_column);
+    }
+}
+
+void NpyOutputFormat::finalizeImpl()
+{
+    if (!has_exception)
+    {
+        writeHeader();
+        writeColumns();
+    }
+}
+
+void NpyOutputFormat::writeHeader()
+{
+    std::ostringstream static_header;
+    static_header << MAGIC_STRING << MAJOR_VERSION << MINOR_VERSION;
+    String static_header_str = static_header.str();
+
+    std::ostringstream shape;
+    shape << '(' << std::to_string(num_rows) << ',';
+    for (auto dim : numpy_shape)
+        shape << std::to_string(dim) << ',';
+    shape << ')';
+
+    std::ostringstream dict;
+    dict << "{'descr':'" << numpy_data_type.str() << "','fortran_order':False,'shape':" << shape.str() << ",}";
+    String dict_str = dict.str();
+    String padding_str = "\n";
+
+    /// completes the length of the header, which is divisible by 64.
+    size_t dict_length = dict_str.length() + 1;
+    size_t header_length = static_header_str.length() + sizeof(UInt32) + dict_length;
+    if (header_length % 64)
+    {
+        header_length = ((header_length / 64) + 1) * 64;
+        dict_length = header_length - static_header_str.length() - sizeof(UInt32);
+        padding_str = std::string(dict_length - dict_str.length(), '\x20');
+        padding_str.back() = '\n';
+    }
+
+    out.write(static_header_str.data(), static_header_str.length());
+    writeBinaryLittleEndian(assert_cast<UInt32>(dict_length), out);
+    out.write(dict_str.data(), dict_str.length());
+    out.write(padding_str.data(), padding_str.length());
+}
+
+void NpyOutputFormat::writeColumns()
+{
+    for (auto column : columns)
+    {
+        switch (nested_data_type->getTypeId())
+        {
+            case TypeIndex::Int8: writeNumpyNumbers<ColumnInt8, Int8>(column, out); break;
+            case TypeIndex::Int16: writeNumpyNumbers<ColumnInt16, Int16>(column, out); break;
+            case TypeIndex::Int32: writeNumpyNumbers<ColumnInt32, Int32>(column, out); break;
+            case TypeIndex::Int64: writeNumpyNumbers<ColumnInt64, Int64>(column, out); break;
+            case TypeIndex::UInt8: writeNumpyNumbers<ColumnUInt8, UInt8>(column, out); break;
+            case TypeIndex::UInt16: writeNumpyNumbers<ColumnUInt16, UInt16>(column, out); break;
+            case TypeIndex::UInt32: writeNumpyNumbers<ColumnUInt32, UInt32>(column, out); break;
+            case TypeIndex::UInt64: writeNumpyNumbers<ColumnUInt64, UInt64>(column, out); break;
+            case TypeIndex::Float32: writeNumpyNumbers<ColumnFloat32, Float32>(column, out); break;
+            case TypeIndex::Float64: writeNumpyNumbers<ColumnFloat64, Float64>(column, out); break;
+            case TypeIndex::FixedString: writeNumpyStrings<ColumnFixedString>(column, numpy_data_type.size, out); break;
+            case TypeIndex::String: writeNumpyStrings<ColumnString>(column, numpy_data_type.size, out); break;
+            default: break;
+        }
+    }
+}
+
+void registerOutputFormatNpy(FormatFactory & factory)
+{
+    factory.registerOutputFormat("Npy",[](
+        WriteBuffer & buf,
+        const Block & sample,
+        const FormatSettings &)
+    {
+        return std::make_shared<NpyOutputFormat>(buf, sample);
+    });
+    factory.markFormatHasNoAppendSupport("Npy");
+}
+
+}

diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.h b/src/Processors/Formats/Impl/NpyOutputFormat.h
new file mode 100644
index 00000000000..083aa928b7c
--- /dev/null
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.h
@@ -0,0 +1,66 @@
+#pragma once
+
+#include
+#include
+#include
+#include
+#include
+#include
+#include
+
+#include
+#include
+#include
+
+
+namespace DB
+{
+
+/** Stream for output data in Npy format.
+ * https://numpy.org/doc/stable/reference/generated/numpy.lib.format.html
+ */
+class NpyOutputFormat : public IOutputFormat
+{
+public:
+    NpyOutputFormat(WriteBuffer & out_, const Block & header_);
+
+    String getName() const override { return "NpyOutputFormat"; }
+
+    String getContentType() const override { return "application/octet-stream"; }
+
+private:
+    struct NumpyDataType
+    {
+        char endianness;
+        char type;
+        size_t size;
+
+        NumpyDataType() = default;
+        NumpyDataType(char endianness_, char type_, size_t size_)
+            : endianness(endianness_), type(type_), size(size_) {}
+        String str();
+    };
+
+    void initialize(const ColumnPtr & column);
+    void consume(Chunk) override;
+    void finalizeImpl() override;
+    void writeHeader();
+    void writeColumns();
+
+    bool is_initialized = false;
+    bool has_exception = false;
+
+    DataTypePtr data_type;
+    DataTypePtr nested_data_type;
+    NumpyDataType numpy_data_type;
+    UInt64 num_rows = 0;
+    std::vector<UInt64> numpy_shape;
+    Columns columns;
+
+    /// static header (version 3.0)
+    constexpr static auto MAGIC_STRING = "\x93NUMPY";
+    constexpr static auto MAJOR_VERSION = '\x03';
+    constexpr static auto MINOR_VERSION = '\x00';
+};
+
+}

diff --git a/tests/queries/0_stateless/02895_npy_output_format.reference b/tests/queries/0_stateless/02895_npy_output_format.reference
new file mode 100644
index 00000000000..b599f1dceea
--- /dev/null
+++ b/tests/queries/0_stateless/02895_npy_output_format.reference
@@ -0,0 +1,60 @@
+-1
+-1
+-1
+-1
+-1
+-1
+-1
+-1
+-1
+-1
+-1
+-1
+1
+1
+1
+1
+1
+1
+1
+1
+1
+1
+1
+1
+0.1
+0.1
+0.1
+0.01
+0.01
+0.01
+npy
+npy
+npy
+npy
+npy
+npy
+array Int8
+array Int16
+array Int32
+array Int64
+array UInt8
+array UInt16
+array UInt32
+array UInt64
+array Float32
+array Float64
+array String
+array String
+[[[1],[2]],[[3],[4]]]
+[[[1],[2]],[[3],[4]]]
+[[[1],[2]],[[3],[4]]]
+[[0.1],[0.2]]
+[[0.1],[0.2]]
+[[0.1],[0.2]]
+[['abb','bbc'],['ccc','dddd']]
+[['abb','bbc'],['ccc','dddd']]
+[['abb','bbc'],['ccc','dddd']]
+array Array(Array(Array(Int8)))
+array Array(Array(Float64))
+array Array(Array(String))

diff --git a/tests/queries/0_stateless/02895_npy_output_format.sh b/tests/queries/0_stateless/02895_npy_output_format.sh
new file mode 100755
index 00000000000..e5226e88a8d
--- /dev/null
+++ b/tests/queries/0_stateless/02895_npy_output_format.sh
@@ -0,0 +1,110 @@
+#!/usr/bin/env bash
+# Tags: no-parallel
+
+CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
+# shellcheck source=../shell_config.sh
+. 
"$CURDIR"/../shell_config.sh + +user_files_path=$($CLICKHOUSE_CLIENT_BINARY -q "select _path,_file from file('nonexist.txt', 'CSV', 'val1 char')" 2>&1 | grep Exception | awk '{gsub("/nonexist.txt","",$9); print $9}') +mkdir -p ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/ +rm -rf ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME:?}/* +chmod 777 ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/ + +${CLICKHOUSE_CLIENT} -q "DROP DATABASE IF EXISTS npy_output_02895;" +${CLICKHOUSE_CLIENT} -q "CREATE DATABASE IF NOT EXISTS npy_output_02895;" + +### test common type +${CLICKHOUSE_CLIENT} -q "CREATE TABLE IF NOT EXISTS npy_output_02895.common +( + i1 Int8, + i2 Int16, + i4 Int32, + i8 Int64, + u1 UInt8, + u2 UInt16, + u4 UInt32, + u8 UInt64, + f4 Float32, + f8 Float64, + fs FixedString(10), + s String, + unknow Int128 +) Engine = MergeTree ORDER BY i1;" + +${CLICKHOUSE_CLIENT} -q "INSERT INTO npy_output_02895.common VALUES (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1), (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1), (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1);" + +${CLICKHOUSE_CLIENT} -n -q "SELECT * FROM npy_output_02895.common FORMAT Npy; -- { clientError TOO_MANY_COLUMNS }" +${CLICKHOUSE_CLIENT} -n -q "SELECT unknow FROM npy_output_02895.common FORMAT Npy; -- { clientError BAD_ARGUMENTS }" + +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy') SELECT i1 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy') SELECT i2 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy') SELECT i4 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy') SELECT i8 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy') SELECT u1 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy') SELECT u2 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy') SELECT u4 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy') SELECT u8 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy') SELECT f4 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy') SELECT f8 FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy') SELECT fs FROM npy_output_02895.common;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy') SELECT s FROM npy_output_02895.common;" + +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy');" 
+${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy');" + +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy');" + +### test nested type +${CLICKHOUSE_CLIENT} -q "CREATE TABLE IF NOT EXISTS npy_output_02895.nested +( + i4 Array(Array(Array(Int8))), + f8 Array(Array(Float64)), + s Array(Array(String)), + unknow Array(Int128), + ragged_1 Array(Array(Int32)), + ragged_2 Array(Array(Int32)) +) Engine = MergeTree ORDER BY i4;" + +${CLICKHOUSE_CLIENT} -q "INSERT INTO npy_output_02895.nested VALUES ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1, 2], [3, 4]], [[1, 2], [3]]), ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1, 2, 3], [4]], [[1, 2], [3]]), ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1], [2, 3, 4]], [[1, 2], [3]]);" + +${CLICKHOUSE_CLIENT} -n -q "SELECT * FROM npy_output_02895.nested 
FORMAT Npy; -- { clientError TOO_MANY_COLUMNS }" +${CLICKHOUSE_CLIENT} -n -q "SELECT unknow FROM npy_output_02895.nested FORMAT Npy; -- { clientError BAD_ARGUMENTS }" +${CLICKHOUSE_CLIENT} -n -q "SELECT ragged_1 FROM npy_output_02895.nested FORMAT Npy; -- { clientError ILLEGAL_COLUMN }" +${CLICKHOUSE_CLIENT} -n -q "SELECT ragged_2 FROM npy_output_02895.nested FORMAT Npy; -- { clientError ILLEGAL_COLUMN }" + +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy') SELECT i4 FROM npy_output_02895.nested;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy') SELECT f8 FROM npy_output_02895.nested;" +${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy') SELECT s FROM npy_output_02895.nested;" + +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy');" +${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy');" + +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy');" +${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy');" + +${CLICKHOUSE_CLIENT} -q "DROP DATABASE IF EXISTS npy_output_02895;" + +rm -rf ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME:?} From fe66d1b67a357155d35ca364a06c43cd44770056 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Tue, 9 Apr 2024 20:23:45 +0800 Subject: [PATCH 040/289] fix style --- .../Formats/Impl/NpyOutputFormat.cpp | 45 ++++++++++--------- src/Processors/Formats/Impl/NpyOutputFormat.h | 5 +-- 2 files changed, 25 insertions(+), 25 deletions(-) diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp index 4a4af67b07e..d04d095e84f 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp +++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp @@ -8,6 +8,7 @@ #include #include #include +#include #include #include @@ -46,8 +47,11 @@ void writeNumpyStrings(const ColumnPtr & column, size_t length, WriteBuffer & bu String NpyOutputFormat::NumpyDataType::str() { - std::ostringstream dtype; - dtype << endianness << type << std::to_string(size); + WriteBufferFromOwnString dtype; + writeChar(endianness, dtype); + writeChar(type, dtype); + writeIntText(size, dtype); + return dtype.str(); } @@ -153,36 +157,33 @@ void NpyOutputFormat::finalizeImpl() void NpyOutputFormat::writeHeader() { - std::ostringstream static_header; - static_header << MAGIC_STRING << MAJOR_VERSION << MINOR_VERSION; - String static_header_str = static_header.str(); - - std::ostringstream shape; - shape << '(' << std::to_string(num_rows) << ','; + WriteBufferFromOwnString shape; + writeIntText(num_rows, shape); + writeChar(',', shape); for (auto dim : numpy_shape) - shape << std::to_string(dim) << ','; - shape << ')'; + { + writeIntText(dim, shape); + writeChar(',', shape); + } - std::ostringstream dict; - dict << "{'descr':'" << numpy_data_type.str() << "','fortran_order':False,'shape':" << shape.str() << ",}"; - 
String dict_str = dict.str();
-    String padding_str = "\n";
+    String dict = "{'descr':'" + numpy_data_type.str() + "','fortran_order':False,'shape':(" + shape.str() + "),}";
+    String padding = "\n";
 
     /// completes the length of the header, which is divisible by 64.
-    size_t dict_length = dict_str.length() + 1;
-    size_t header_length = static_header_str.length() + sizeof(UInt32) + dict_length;
+    size_t dict_length = dict.length() + 1;
+    size_t header_length = STATIC_HEADER_LENGTH + sizeof(UInt32) + dict_length;
     if (header_length % 64)
     {
         header_length = ((header_length / 64) + 1) * 64;
-        dict_length = header_length - static_header_str.length() - sizeof(UInt32);
-        padding_str = std::string(dict_length - dict_str.length(), '\x20');
-        padding_str.back() = '\n';
+        dict_length = header_length - STATIC_HEADER_LENGTH - sizeof(UInt32);
+        padding = std::string(dict_length - dict.length(), '\x20');
+        padding.back() = '\n';
     }
 
-    out.write(static_header_str.data(), static_header_str.length());
+    out.write(STATIC_HEADER, STATIC_HEADER_LENGTH);
     writeBinaryLittleEndian(assert_cast<UInt32>(dict_length), out);
-    out.write(dict_str.data(), dict_str.length());
-    out.write(padding_str.data(), padding_str.length());
+    out.write(dict.data(), dict.length());
+    out.write(padding.data(), padding.length());
 }
 
 void NpyOutputFormat::writeColumns()

diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.h b/src/Processors/Formats/Impl/NpyOutputFormat.h
index 083aa928b7c..a483420d2d6 100644
--- a/src/Processors/Formats/Impl/NpyOutputFormat.h
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.h
@@ -58,9 +58,8 @@ private:
     Columns columns;
 
     /// static header (version 3.0)
-    constexpr static auto MAGIC_STRING = "\x93NUMPY";
-    constexpr static auto MAJOR_VERSION = '\x03';
-    constexpr static auto MINOR_VERSION = '\x00';
+    constexpr static auto STATIC_HEADER = "\x93NUMPY\x03\x00";
+    constexpr static size_t STATIC_HEADER_LENGTH = 8;
 };
 
 }

From 3c58e5873b24e0aec20a4c5b97c3ab6bb849c47e Mon Sep 17 00:00:00 2001
From: Andrey Zvonov
Date: Tue, 9 Apr 2024 19:06:14 +0000
Subject: [PATCH 041/289] fix reading of {} with more than 1000 objects under
 each

---
 src/Storages/StorageS3.cpp | 25 ++++++++++++-------------
 1 file changed, 12 insertions(+), 13 deletions(-)

diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp
index 85d9b45291c..ffe3213a4bc 100644
--- a/src/Storages/StorageS3.cpp
+++ b/src/Storages/StorageS3.cpp
@@ -214,10 +214,8 @@ public:
         expanded_keys = expandSelectionGlob(globbed_uri.key);
         expanded_keys_iter = expanded_keys.begin();
 
-        bool no_globs_in_key = fillBufferForKey(*expanded_keys_iter);
+        fillBufferForKey(*expanded_keys_iter);
         expanded_keys_iter++;
-        if (expanded_keys_iter == expanded_keys.end() && no_globs_in_key)
-            is_finished_for_key = true;
     }
 
     KeyWithInfoPtr next(size_t)
@@ -252,6 +250,7 @@ private:
             buffer_iter = buffer.begin();
             if (read_keys)
                 read_keys->insert(read_keys->end(), buffer.begin(), buffer.end());
+            is_finished_for_key = true;
             return true;
         }
 
@@ -306,17 +305,17 @@ private:
                     return answer;
             }
 
-            if (expanded_keys_iter != expanded_keys.end())
-            {
-                bool no_globs_in_key = fillBufferForKey(*expanded_keys_iter);
-                expanded_keys_iter++;
-                if (expanded_keys_iter == expanded_keys.end() && no_globs_in_key)
-                    is_finished_for_key = true;
-                continue;
-            }
-
-            if (is_finished_for_key)
-                return {};
+            if (is_finished_for_key)
+            {
+                if (expanded_keys_iter != expanded_keys.end())
+                {
+                    fillBufferForKey(*expanded_keys_iter);
+                    expanded_keys_iter++;
+                    continue;
+                }
+                else
+                    return {};
+            }
 
             try
             {

From 093b71b8585161e91f571d9991e2d351effd10fa Mon Sep 17
00:00:00 2001 From: Andrey Zvonov Date: Tue, 9 Apr 2024 21:01:01 +0000 Subject: [PATCH 042/289] added test for selection globs with many files under --- tests/integration/test_storage_s3/test.py | 38 +++++++++++++++++++++++ 1 file changed, 38 insertions(+) diff --git a/tests/integration/test_storage_s3/test.py b/tests/integration/test_storage_s3/test.py index a4ed94c815b..60b0e8792d7 100644 --- a/tests/integration/test_storage_s3/test.py +++ b/tests/integration/test_storage_s3/test.py @@ -678,6 +678,44 @@ def test_s3_glob_scheherazade(started_cluster): assert run_query(instance, query).splitlines() == ["1001\t1001\t1001\t1001"] +# a bit modified version of scheherazade test +# checks e.g. `prefix{1,2}/file*.csv`, where there are more than 1000 files under each of prefix1, prefix2. +def test_s3_glob_many_objects_under_selection(started_cluster): + bucket = started_cluster.minio_bucket + instance = started_cluster.instances["dummy"] # type: ClickHouseInstance + table_format = "column1 UInt32, column2 UInt32, column3 UInt32" + values = "(1, 1, 1)" + jobs = [] + for file_num in range(1100): + + def create_files(file_num): + for folder_num in range(1, 3): + path = f"folder{folder_num}/file{file_num}.csv" + query = "insert into table function s3('http://{}:{}/{}/{}', 'CSV', '{}') values {}".format( + started_cluster.minio_ip, + MINIO_INTERNAL_PORT, + bucket, + path, + table_format, + values, + ) + run_query(instance, query) + + jobs.append(threading.Thread(target=create_files, args=(file_num,))) + jobs[-1].start() + + for job in jobs: + job.join() + + query = "select count(), sum(column1), sum(column2), sum(column3) from s3('http://{}:{}/{}/folder{{1,2}}/file*.csv', 'CSV', '{}')".format( + started_cluster.minio_redirect_host, + started_cluster.minio_redirect_port, + bucket, + table_format, + ) + assert run_query(instance, query).splitlines() == ["2200\t2200\t2200\t2200"] + + def run_s3_mocks(started_cluster): script_dir = os.path.join(os.path.dirname(__file__), "s3_mocks") start_mock_servers( From d9de697305522a1c267debaf13792ab900b16a83 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Wed, 10 Apr 2024 17:48:23 +0800 Subject: [PATCH 043/289] refactor test --- .../0_stateless/02895_npy_output_format.sh | 165 +++++++++--------- 1 file changed, 82 insertions(+), 83 deletions(-) diff --git a/tests/queries/0_stateless/02895_npy_output_format.sh b/tests/queries/0_stateless/02895_npy_output_format.sh index e5226e88a8d..27274f6a925 100755 --- a/tests/queries/0_stateless/02895_npy_output_format.sh +++ b/tests/queries/0_stateless/02895_npy_output_format.sh @@ -10,101 +10,100 @@ mkdir -p ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/ rm -rf ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME:?}/* chmod 777 ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/ -${CLICKHOUSE_CLIENT} -q "DROP DATABASE IF EXISTS npy_output_02895;" -${CLICKHOUSE_CLIENT} -q "CREATE DATABASE IF NOT EXISTS npy_output_02895;" +${CLICKHOUSE_CLIENT} -n -q " + DROP DATABASE IF EXISTS npy_output_02895; + CREATE DATABASE IF NOT EXISTS npy_output_02895; -### test common type -${CLICKHOUSE_CLIENT} -q "CREATE TABLE IF NOT EXISTS npy_output_02895.common -( - i1 Int8, - i2 Int16, - i4 Int32, - i8 Int64, - u1 UInt8, - u2 UInt16, - u4 UInt32, - u8 UInt64, - f4 Float32, - f8 Float64, - fs FixedString(10), - s String, - unknow Int128 -) Engine = MergeTree ORDER BY i1;" + CREATE TABLE IF NOT EXISTS npy_output_02895.common + ( + i1 Int8, + i2 Int16, + i4 Int32, + i8 Int64, + u1 UInt8, + u2 UInt16, + u4 UInt32, + u8 UInt64, + f4 
Float32, + f8 Float64, + fs FixedString(10), + s String, + unknow Int128 + ) Engine = MergeTree ORDER BY i1; -${CLICKHOUSE_CLIENT} -q "INSERT INTO npy_output_02895.common VALUES (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1), (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1), (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1);" + INSERT INTO npy_output_02895.common VALUES (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1), (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1), (-1,-1,-1,-1,1,1,1,1,0.1,0.01,'npy','npy',1); -${CLICKHOUSE_CLIENT} -n -q "SELECT * FROM npy_output_02895.common FORMAT Npy; -- { clientError TOO_MANY_COLUMNS }" -${CLICKHOUSE_CLIENT} -n -q "SELECT unknow FROM npy_output_02895.common FORMAT Npy; -- { clientError BAD_ARGUMENTS }" + SELECT * FROM npy_output_02895.common FORMAT Npy; -- { clientError TOO_MANY_COLUMNS } + SELECT unknow FROM npy_output_02895.common FORMAT Npy; -- { clientError BAD_ARGUMENTS } -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy') SELECT i1 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy') SELECT i2 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy') SELECT i4 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy') SELECT i8 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy') SELECT u1 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy') SELECT u2 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy') SELECT u4 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy') SELECT u8 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy') SELECT f4 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy') SELECT f8 FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy') SELECT fs FROM npy_output_02895.common;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy') SELECT s FROM npy_output_02895.common;" + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy') SELECT i1 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy') SELECT i2 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy') SELECT i4 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION 
file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy') SELECT i8 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy') SELECT u1 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy') SELECT u2 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy') SELECT u4 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy') SELECT u8 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy') SELECT f4 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy') SELECT f8 FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy') SELECT fs FROM npy_output_02895.common; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy') SELECT s FROM npy_output_02895.common; -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy');" + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy'); + SELECT * FROM 
file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy'); -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy');" + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int8.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int16.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int32.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_int64.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint8.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint16.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint32.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_uint64.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float32.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_float64.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_fixedstring.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_common_string.npy'); -### test nested type -${CLICKHOUSE_CLIENT} -q "CREATE TABLE IF NOT EXISTS npy_output_02895.nested -( - i4 Array(Array(Array(Int8))), - f8 Array(Array(Float64)), - s Array(Array(String)), - unknow Array(Int128), - ragged_1 Array(Array(Int32)), - ragged_2 Array(Array(Int32)) -) Engine = MergeTree ORDER BY i4;" + CREATE TABLE IF NOT EXISTS npy_output_02895.nested + ( + i4 Array(Array(Array(Int8))), + f8 Array(Array(Float64)), + s Array(Array(String)), + unknow Array(Int128), + ragged_1 Array(Array(Int32)), + ragged_2 Array(Array(Int32)) + ) Engine = MergeTree ORDER BY i4; -${CLICKHOUSE_CLIENT} -q 
"INSERT INTO npy_output_02895.nested VALUES ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1, 2], [3, 4]], [[1, 2], [3]]), ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1, 2, 3], [4]], [[1, 2], [3]]), ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1], [2, 3, 4]], [[1, 2], [3]]);" + INSERT INTO npy_output_02895.nested VALUES ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1, 2], [3, 4]], [[1, 2], [3]]), ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1, 2, 3], [4]], [[1, 2], [3]]), ([[[1], [2]], [[3], [4]]], [[0.1], [0.2]], [['a', 'bb'], ['ccc', 'dddd']], [1, 2], [[1], [2, 3, 4]], [[1, 2], [3]]); -${CLICKHOUSE_CLIENT} -n -q "SELECT * FROM npy_output_02895.nested FORMAT Npy; -- { clientError TOO_MANY_COLUMNS }" -${CLICKHOUSE_CLIENT} -n -q "SELECT unknow FROM npy_output_02895.nested FORMAT Npy; -- { clientError BAD_ARGUMENTS }" -${CLICKHOUSE_CLIENT} -n -q "SELECT ragged_1 FROM npy_output_02895.nested FORMAT Npy; -- { clientError ILLEGAL_COLUMN }" -${CLICKHOUSE_CLIENT} -n -q "SELECT ragged_2 FROM npy_output_02895.nested FORMAT Npy; -- { clientError ILLEGAL_COLUMN }" + SELECT * FROM npy_output_02895.nested FORMAT Npy; -- { clientError TOO_MANY_COLUMNS } + SELECT unknow FROM npy_output_02895.nested FORMAT Npy; -- { clientError BAD_ARGUMENTS } + SELECT ragged_1 FROM npy_output_02895.nested FORMAT Npy; -- { clientError ILLEGAL_COLUMN } + SELECT ragged_2 FROM npy_output_02895.nested FORMAT Npy; -- { clientError ILLEGAL_COLUMN } -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy') SELECT i4 FROM npy_output_02895.nested;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy') SELECT f8 FROM npy_output_02895.nested;" -${CLICKHOUSE_CLIENT} -q "INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy') SELECT s FROM npy_output_02895.nested;" + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy') SELECT i4 FROM npy_output_02895.nested; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy') SELECT f8 FROM npy_output_02895.nested; + INSERT INTO TABLE FUNCTION file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy') SELECT s FROM npy_output_02895.nested; -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy');" -${CLICKHOUSE_CLIENT} -q "SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy');" + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy'); + SELECT * FROM file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy'); -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy');" -${CLICKHOUSE_CLIENT} -q "DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy');" -${CLICKHOUSE_CLIENT} -q "DESC 
file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy');" + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_int32.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_float64.npy'); + DESC file('${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME}/02895_nested_string.npy'); -${CLICKHOUSE_CLIENT} -q "DROP DATABASE IF EXISTS npy_output_02895;" + DROP DATABASE IF EXISTS npy_output_02895;" rm -rf ${user_files_path}/${CLICKHOUSE_TEST_UNIQUE_NAME:?} From c9b05eac022254c71323d2715a0dc1a32ae9c2f7 Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Wed, 10 Apr 2024 12:02:01 +0000 Subject: [PATCH 044/289] fix test_s3_glob_many_objects_under_selection --- tests/integration/test_storage_s3/test.py | 26 ++++++++++++++++------- 1 file changed, 18 insertions(+), 8 deletions(-) diff --git a/tests/integration/test_storage_s3/test.py b/tests/integration/test_storage_s3/test.py index 60b0e8792d7..28b70911b77 100644 --- a/tests/integration/test_storage_s3/test.py +++ b/tests/integration/test_storage_s3/test.py @@ -678,19 +678,19 @@ def test_s3_glob_scheherazade(started_cluster): assert run_query(instance, query).splitlines() == ["1001\t1001\t1001\t1001"] -# a bit modified version of scheherazade test -# checks e.g. `prefix{1,2}/file*.csv`, where there are more than 1000 files under each of prefix1, prefix2. +# a bit simplified version of scheherazade test +# checks e.g. `prefix{1,2}/file*.csv`, where there are more than 1000 files under prefix1. def test_s3_glob_many_objects_under_selection(started_cluster): bucket = started_cluster.minio_bucket instance = started_cluster.instances["dummy"] # type: ClickHouseInstance table_format = "column1 UInt32, column2 UInt32, column3 UInt32" values = "(1, 1, 1)" jobs = [] - for file_num in range(1100): + for thread_num in range(16): - def create_files(file_num): - for folder_num in range(1, 3): - path = f"folder{folder_num}/file{file_num}.csv" + def create_files(thread_num): + for f_num in range(thread_num * 63, thread_num * 63 + 63): + path = f"folder1/file{f_num}.csv" query = "insert into table function s3('http://{}:{}/{}/{}', 'CSV', '{}') values {}".format( started_cluster.minio_ip, MINIO_INTERNAL_PORT, @@ -701,9 +701,19 @@ def test_s3_glob_many_objects_under_selection(started_cluster): ) run_query(instance, query) - jobs.append(threading.Thread(target=create_files, args=(file_num,))) + jobs.append(threading.Thread(target=create_files, args=(thread_num,))) jobs[-1].start() + query = "insert into table function s3('http://{}:{}/{}/{}', 'CSV', '{}') values {}".format( + started_cluster.minio_ip, + MINIO_INTERNAL_PORT, + bucket, + f"folder2/file0.csv", + table_format, + values, + ) + run_query(instance, query) + for job in jobs: job.join() @@ -713,7 +723,7 @@ def test_s3_glob_many_objects_under_selection(started_cluster): bucket, table_format, ) - assert run_query(instance, query).splitlines() == ["2200\t2200\t2200\t2200"] + assert run_query(instance, query).splitlines() == ["1009\t1009\t1009\t1009"] def run_s3_mocks(started_cluster): From 9975b6a0f5c313a2552a8169f5be555dd2f7f4ad Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Wed, 10 Apr 2024 20:18:30 +0800 Subject: [PATCH 045/289] fix build --- src/Processors/Formats/Impl/NpyOutputFormat.cpp | 4 ++-- src/Processors/Formats/Impl/NpyOutputFormat.h | 3 +-- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp index 
d04d095e84f..f43deb816e0 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp +++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp @@ -45,7 +45,7 @@ void writeNumpyStrings(const ColumnPtr & column, size_t length, WriteBuffer & bu } -String NpyOutputFormat::NumpyDataType::str() +String NpyOutputFormat::NumpyDataType::str() const { WriteBufferFromOwnString dtype; writeChar(endianness, dtype); @@ -188,7 +188,7 @@ void NpyOutputFormat::writeHeader() void NpyOutputFormat::writeColumns() { - for (auto column : columns) + for (const auto & column : columns) { switch (nested_data_type->getTypeId()) { diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.h b/src/Processors/Formats/Impl/NpyOutputFormat.h index a483420d2d6..f1d0216a8c3 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.h +++ b/src/Processors/Formats/Impl/NpyOutputFormat.h @@ -9,7 +9,6 @@ #include #include -#include #include @@ -38,7 +37,7 @@ private: NumpyDataType() = default; NumpyDataType(char endianness_, char type_, size_t size_) : endianness(endianness_), type(type_), size(size_) {} - String str(); + String str() const; }; void initialize(const ColumnPtr & column); From 9085816fcb25c34ffc4ce664f3f10b4c3aca160d Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Wed, 10 Apr 2024 23:06:51 +0800 Subject: [PATCH 046/289] remove from async test --- .../queries/0_stateless/02187_async_inserts_all_formats.python | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02187_async_inserts_all_formats.python b/tests/queries/0_stateless/02187_async_inserts_all_formats.python index fa555c78f8b..943e32d4cf2 100644 --- a/tests/queries/0_stateless/02187_async_inserts_all_formats.python +++ b/tests/queries/0_stateless/02187_async_inserts_all_formats.python @@ -38,7 +38,7 @@ def run_test(data_format, gen_data_template, settings): formats = ( client.query( "SELECT name FROM system.formats WHERE is_input AND is_output \ - AND name NOT IN ('CapnProto', 'RawBLOB', 'Template', 'ProtobufSingle', 'LineAsString', 'Protobuf', 'ProtobufList') ORDER BY name" + AND name NOT IN ('CapnProto', 'RawBLOB', 'Template', 'ProtobufSingle', 'LineAsString', 'Protobuf', 'ProtobufList', 'Npy') ORDER BY name" ) .strip() .split("\n") From 0669591e35e0b6f19c148ff941c2497a0e38435c Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Wed, 10 Apr 2024 17:33:48 +0000 Subject: [PATCH 047/289] small code cleanup --- src/Storages/StorageS3.cpp | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index ffe3213a4bc..acef213c1f4 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -237,7 +237,7 @@ public: private: using ListObjectsOutcome = Aws::S3::Model::ListObjectsV2Outcome; - bool fillBufferForKey(const std::string & uri_key) + void fillBufferForKey(const std::string & uri_key) { is_finished_for_key = false; const String key_prefix = uri_key.substr(0, uri_key.find_first_of("*?{")); @@ -251,7 +251,7 @@ private: if (read_keys) read_keys->insert(read_keys->end(), buffer.begin(), buffer.end()); is_finished_for_key = true; - return true; + return; } request = {}; @@ -270,7 +270,7 @@ private: filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns); fillInternalBufferAssumeLocked(); - return false; + return; } KeyWithInfoPtr nextAssumeLocked() From b464d16d5fbb67797677d63d05d8bd9802821a7c Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 11 Apr 2024 11:34:56 +0800 Subject: 
[PATCH 048/289] refactor and fix type conversion

---
 .../Formats/Impl/NpyOutputFormat.cpp          | 139 ++++++++++--------
 src/Processors/Formats/Impl/NpyOutputFormat.h |  10 +-
 2 files changed, 87 insertions(+), 62 deletions(-)

diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
index f43deb816e0..d54fc7e68f2 100644
--- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
@@ -55,6 +55,20 @@ String NpyOutputFormat::NumpyDataType::str() const
     return dtype.str();
 }
 
+String NpyOutputFormat::shapeStr() const
+{
+    WriteBufferFromOwnString shape;
+    writeIntText(num_rows, shape);
+    writeChar(',', shape);
+    for (UInt64 dim : numpy_shape)
+    {
+        writeIntText(dim, shape);
+        writeChar(',', shape);
+    }
+
+    return shape.str();
+}
+
 NpyOutputFormat::NpyOutputFormat(WriteBuffer & out_, const Block & header_) : IOutputFormat(header_, out_)
 {
     const auto & header = getPort(PortKind::Main).getHeader();
@@ -62,20 +76,13 @@ NpyOutputFormat::NpyOutputFormat(WriteBuffer & out_, const Block & header_) : IO
     if (data_types.size() > 1)
         throw Exception(ErrorCodes::TOO_MANY_COLUMNS, "Expected single column for Npy output format, got {}", data_types.size());
     data_type = data_types[0];
+
+    if (!getNumpyDataType(data_type))
+        throw Exception(ErrorCodes::BAD_ARGUMENTS, "Type {} is not supported for Npy output format", nested_data_type->getName());
 }
 
-void NpyOutputFormat::initialize(const ColumnPtr & column)
+bool NpyOutputFormat::getNumpyDataType(const DataTypePtr & type)
 {
-    auto type = data_type;
-    ColumnPtr nested_column = column;
-    while (type->getTypeId() == TypeIndex::Array)
-    {
-        const auto * array_column = assert_cast<const ColumnArray *>(nested_column.get());
-        numpy_shape.push_back(array_column->getOffsets()[0]);
-        type = assert_cast<const DataTypeArray *>(type.get())->getNestedType();
-        nested_column = array_column->getDataPtr();
-    }
-
     switch (type->getTypeId())
     {
         case TypeIndex::Int8: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int8)); break;
@@ -90,65 +97,86 @@ void NpyOutputFormat::initialize(const ColumnPtr & column)
         case TypeIndex::Float64: numpy_data_type = NumpyDataType('<', 'f', sizeof(Float64)); break;
         case TypeIndex::FixedString: numpy_data_type = NumpyDataType('|', 'S', assert_cast<const DataTypeFixedString *>(type.get())->getN()); break;
        case TypeIndex::String: numpy_data_type = NumpyDataType('|', 'S', 0); break;
-        default:
-            has_exception = true;
-            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Type {} is not supported for Npy output format", type->getName());
+        case TypeIndex::Array: return getNumpyDataType(assert_cast<const DataTypeArray *>(type.get())->getNestedType());
+        default: nested_data_type = type; return false;
     }
+    nested_data_type = type;
+    return true;
 }
 
 void NpyOutputFormat::consume(Chunk chunk)
 {
-    if (!has_exception)
+    if (!invalid_shape)
     {
         num_rows += chunk.getNumRows();
-        auto column = chunk.getColumns()[0];
+        const auto & column = chunk.getColumns()[0];
 
         if (!is_initialized)
         {
-            initialize(column);
+            initShape(column);
             is_initialized = true;
         }
 
-        /// check shape
-        auto type = data_type;
-        ColumnPtr nested_column = column;
-        int dim = 0;
-        while (type->getTypeId() == TypeIndex::Array)
+        if (!checkShape(column))
         {
-            const auto * array_column = assert_cast<const ColumnArray *>(nested_column.get());
-            const auto & array_offset = array_column->getOffsets();
-            for (size_t i = 1; i < array_offset.size(); ++i)
-            {
-                if (array_offset[i] - array_offset[i - 1] != numpy_shape[dim])
-                {
-                    has_exception = true;
-                    throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ClickHouse doesn't support object types, cannot
format ragged nested sequences (which is a list of arrays with different shapes)");
-                }
-            }
-            type = assert_cast<const DataTypeArray *>(type.get())->getNestedType();
-            nested_column = array_column->getDataPtr();
-            dim++;
+            invalid_shape = true;
+            throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ClickHouse doesn't support object types, cannot format ragged nested sequences (which is a list of arrays with different shapes)");
         }
-
-        /// for type String, get maximum string length
-        if (type->getTypeId() == TypeIndex::String)
-        {
-            const auto & string_offsets = assert_cast<const ColumnString *>(nested_column.get())->getOffsets();
-            for (size_t i = 0; i < string_offsets.size(); ++i)
-            {
-                size_t string_length = static_cast<size_t>(string_offsets[i] - 1 - string_offsets[i - 1]);
-                numpy_data_type.size = numpy_data_type.size > string_length ? numpy_data_type.size : string_length;
-            }
-        }
-
-        columns.push_back(nested_column);
     }
 }
 
+void NpyOutputFormat::initShape(const ColumnPtr & column)
+{
+    auto type = data_type;
+    ColumnPtr nested_column = column;
+    while (type->getTypeId() == TypeIndex::Array)
+    {
+        const auto * array_column = assert_cast<const ColumnArray *>(nested_column.get());
+
+        numpy_shape.push_back(array_column->getOffsets()[0]);
+
+        type = assert_cast<const DataTypeArray *>(type.get())->getNestedType();
+        nested_column = array_column->getDataPtr();
+    }
+}
+
+bool NpyOutputFormat::checkShape(const ColumnPtr & column)
+{
+    auto type = data_type;
+    ColumnPtr nested_column = column;
+    int dim = 0;
+    while (type->getTypeId() == TypeIndex::Array)
+    {
+        const auto * array_column = assert_cast<const ColumnArray *>(nested_column.get());
+        const auto & array_offset = array_column->getOffsets();
+
+        for (size_t i = 1; i < array_offset.size(); ++i)
+            if (array_offset[i] - array_offset[i - 1] != numpy_shape[dim])
+                return false;
+
+        type = assert_cast<const DataTypeArray *>(type.get())->getNestedType();
+        nested_column = array_column->getDataPtr();
+        dim += 1;
+    }
+
+    if (type->getTypeId() == TypeIndex::String)
+    {
+        const auto & string_offsets = assert_cast<const ColumnString *>(nested_column.get())->getOffsets();
+        for (size_t i = 0; i < string_offsets.size(); ++i)
+        {
+            size_t string_length = static_cast<size_t>(string_offsets[i] - 1 - string_offsets[i - 1]);
+            numpy_data_type.size = numpy_data_type.size > string_length ? numpy_data_type.size : string_length;
+        }
+    }
+
+    columns.push_back(nested_column);
+    return true;
+}
+
 void NpyOutputFormat::finalizeImpl()
 {
-    if (!has_exception)
+    if (!invalid_shape)
     {
         writeHeader();
         writeColumns();
@@ -157,16 +185,7 @@ void NpyOutputFormat::finalizeImpl()
 
 void NpyOutputFormat::writeHeader()
 {
-    WriteBufferFromOwnString shape;
-    writeIntText(num_rows, shape);
-    writeChar(',', shape);
-    for (auto dim : numpy_shape)
-    {
-        writeIntText(dim, shape);
-        writeChar(',', shape);
-    }
-
-    String dict = "{'descr':'" + numpy_data_type.str() + "','fortran_order':False,'shape':(" + shape.str() + "),}";
+    String dict = "{'descr':'" + numpy_data_type.str() + "','fortran_order':False,'shape':(" + shapeStr() + "),}";
     String padding = "\n";
 
     /// completes the length of the header, which is divisible by 64.
@@ -181,7 +200,7 @@ void NpyOutputFormat::writeHeader()
     }
 
     out.write(STATIC_HEADER, STATIC_HEADER_LENGTH);
-    writeBinaryLittleEndian(assert_cast<UInt32>(dict_length), out);
+    writeBinaryLittleEndian(static_cast<UInt32>(dict_length), out);
     out.write(dict.data(), dict.length());
     out.write(padding.data(), padding.length());
 }
diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.h b/src/Processors/Formats/Impl/NpyOutputFormat.h
index f1d0216a8c3..83fad657b2e 100644
--- a/src/Processors/Formats/Impl/NpyOutputFormat.h
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.h
@@ -40,14 +40,20 @@ private:
         String str() const;
     };
 
-    void initialize(const ColumnPtr & column);
+    String shapeStr() const;
+
+    bool getNumpyDataType(const DataTypePtr & type);
+
     void consume(Chunk) override;
+    void initShape(const ColumnPtr & column);
+    bool checkShape(const ColumnPtr & column);
+
     void finalizeImpl() override;
     void writeHeader();
     void writeColumns();
 
     bool is_initialized = false;
-    bool has_exception = false;
+    bool invalid_shape = false;
 
     DataTypePtr data_type;
     DataTypePtr nested_data_type;

From 2f6db2ac47d55a1d740463173d2613d895419256 Mon Sep 17 00:00:00 2001
From: skyoct
Date: Sun, 21 Apr 2024 12:01:31 +0000
Subject: [PATCH 049/289] fix: better

---
 src/Functions/clamp.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp
index 0593c6c6b16..3438377afbf 100644
--- a/src/Functions/clamp.cpp
+++ b/src/Functions/clamp.cpp
@@ -42,12 +42,13 @@ public:
         Columns converted_columns(arg_size);
         for (size_t arg = 0; arg < arg_size; ++arg)
             converted_columns[arg] = castColumn(arguments[arg], result_type)->convertToFullColumnIfConst();
-        if (converted_columns[1]->compareAt(0, 0, *converted_columns[2], 1) > 0)
-            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Function {} the minimum value cannot be greater than the maximum value", getName());
 
         auto result_column = result_type->createColumn();
         for (size_t row_num = 0; row_num < input_rows_count; ++row_num)
         {
+            if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[2], 1) > 0)
+                throw Exception(ErrorCodes::BAD_ARGUMENTS, "Function {} the minimum value cannot be greater than the maximum value", getName());
+
             size_t best_arg = 0;
             if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) > 0)
                 best_arg = 1;

From ab49ab9172dba3c26351b9ab1e417545696a86e8 Mon Sep 17 00:00:00 2001
From: skyoct
Date: Sun, 21 Apr 2024 12:03:15 +0000
Subject: [PATCH 050/289] test

---
 tests/queries/0_stateless/03036_clamp.reference | 8 ++++++--
 tests/queries/0_stateless/03036_clamp.sql       | 9 +++++++--
 2 files changed, 13 insertions(+), 4 deletions(-)

diff --git a/tests/queries/0_stateless/03036_clamp.reference b/tests/queries/0_stateless/03036_clamp.reference
index 5c8de57794d..b866caf2261 100644
--- a/tests/queries/0_stateless/03036_clamp.reference
+++ b/tests/queries/0_stateless/03036_clamp.reference
@@ -6,5 +6,9 @@ b
 ['hello']
 -1
 234
-null
-null
\ No newline at end of file
+\N
+\N
+5
+0
+1
+2
diff --git a/tests/queries/0_stateless/03036_clamp.sql b/tests/queries/0_stateless/03036_clamp.sql
index e075096f8ef..d225be63f46 100644
--- a/tests/queries/0_stateless/03036_clamp.sql
+++ b/tests/queries/0_stateless/03036_clamp.sql
@@ -2,9 +2,14 @@ SELECT clamp(1, 10, 20);
 SELECT clamp(30, 10, 20);
 SELECT clamp(15, 10, 20);
 SELECT clamp('a', 'b', 'c');
-SELECT clamp(today(), yesterday() - 10, yesterday() + 10) - today()
+SELECT clamp(today(), yesterday() - 10, yesterday() + 10) - today();
 SELECT clamp([], ['hello'], ['world']);
 SELECT clamp(-1., -1000., 18446744073709551615.);
 SELECT clamp(toNullable(123), 234, 456);
 select clamp(1, null, 5);
-select clamp(1, 6, null);
\ No newline at end of file
+select clamp(1, 6, null);
+select clamp(1, 5, nan);
+select clamp(toInt64(number), toInt64(number-1), toInt64(number+1)) from numbers(3);
+select clamp(number, number-1, number+1) from numbers(3); -- { serverError 386 }
+select clamp(1, 3, 2); -- { serverError 36 }
+select clamp(1, data[1], data[2]) from (select arrayJoin([[1, 2], [2,3], [3,2], [4, 4]]) as data); -- { serverError 36 }

From c7fcc5493cfe5b5b3e2ab884ad1273cbee25c688 Mon Sep 17 00:00:00 2001
From: HowePa <2873679104@qq.com>
Date: Tue, 23 Apr 2024 11:37:55 +0800
Subject: [PATCH 051/289] fix typo for part log

---
 docs/en/operations/system-tables/part_log.md | 2 +-
 src/Interpreters/PartLog.cpp                 | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/en/operations/system-tables/part_log.md b/docs/en/operations/system-tables/part_log.md
index af582646653..c0caea1ce5e 100644
--- a/docs/en/operations/system-tables/part_log.md
+++ b/docs/en/operations/system-tables/part_log.md
@@ -14,7 +14,7 @@ The `system.part_log` table contains the following columns:
 - `event_type` ([Enum8](../../sql-reference/data-types/enum.md)) — Type of the event that occurred with the data part. Can have one of the following values:
     - `NewPart` — Inserting of a new data part.
     - `MergeParts` — Merging of data parts.
-    - `DownloadParts` — Downloading a data part.
+    - `DownloadPart` — Downloading a data part.
     - `RemovePart` — Removing or detaching a data part using [DETACH PARTITION](../../sql-reference/statements/alter/partition.md#alter_detach-partition).
     - `MutatePart` — Mutating of a data part.
    - `MovePart` — Moving the data part from the one disk to another one.
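Stepping back to the clamp() change above: the min > max check has to run per row because, after castColumn() and convertToFullColumnIfConst(), the bounds are full columns and every row may carry its own min and max (the new clamp(1, data[1], data[2]) test exercises exactly that). A standalone sketch of the per-row rule, using plain vectors instead of ClickHouse's IColumn:

    #include <stdexcept>
    #include <vector>

    // Clamp a column of values against per-row bounds, validating each row.
    std::vector<double> clampColumns(const std::vector<double> & values,
                                     const std::vector<double> & mins,
                                     const std::vector<double> & maxs)
    {
        std::vector<double> result;
        result.reserve(values.size());
        for (size_t row = 0; row < values.size(); ++row)
        {
            if (mins[row] > maxs[row])   // checked per row, not once against row 0
                throw std::invalid_argument("clamp: the minimum value cannot be greater than the maximum value");
            double v = values[row];
            if (v < mins[row]) v = mins[row];
            if (v > maxs[row]) v = maxs[row];
            result.push_back(v);
        }
        return result;
    }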
diff --git a/src/Interpreters/PartLog.cpp b/src/Interpreters/PartLog.cpp index 66f933f1afa..db339375231 100644 --- a/src/Interpreters/PartLog.cpp +++ b/src/Interpreters/PartLog.cpp @@ -101,7 +101,7 @@ ColumnsDescription PartLogElement::getColumnsDescription() "Can have one of the following values: " "NewPart — Inserting of a new data part, " "MergeParts — Merging of data parts, " - "DownloadParts — Downloading a data part, " + "DownloadPart — Downloading a data part, " "RemovePart — Removing or detaching a data part using DETACH PARTITION, " "MutatePart — Mutating of a data part, " "MovePart — Moving the data part from the one disk to another one."}, From 1f207de7a10dfc9c9b0ca76f8d62d55da6e04c61 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Wed, 24 Apr 2024 16:40:27 +0000 Subject: [PATCH 052/289] Add another case with GROUP BY USE NULLS --- ...3023_group_by_use_nulls_analyzer_crashes.reference | 10 ++++++++++ .../03023_group_by_use_nulls_analyzer_crashes.sql | 11 +++++++++++ 2 files changed, 21 insertions(+) diff --git a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference index 17a17484a0c..e2682487229 100644 --- a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference +++ b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference @@ -66,3 +66,13 @@ a a a a a a +0 0 +0 \N +1 2 +1 \N +2 4 +2 \N +\N 0 +\N 2 +\N 4 +\N \N diff --git a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql index 68710137542..f2d4ac8acee 100644 --- a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql +++ b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql @@ -21,3 +21,14 @@ SELECT tuple(number + 1) AS x FROM numbers(10) GROUP BY number + 1, toString(x) SELECT tuple(tuple(number)) AS x FROM numbers(10) WHERE toString(toUUID(tuple(number), NULL), x) GROUP BY number, (toString(x), number) WITH CUBE SETTINGS group_by_use_nulls = 1 FORMAT Null; SELECT materialize('a'), 'a' AS key GROUP BY key WITH CUBE WITH TOTALS SETTINGS group_by_use_nulls = 1; + +EXPLAIN QUERY TREE +SELECT a, b +FROM numbers(3) +GROUP BY number as a, (number + number) as b WITH CUBE +ORDER BY a, b format Null; + +SELECT a, b +FROM numbers(3) +GROUP BY number as a, (number + number) as b WITH CUBE +ORDER BY a, b; From c9a31599c08f7281acff09b86aa68d7da345efdc Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Wed, 24 Apr 2024 22:14:47 +0000 Subject: [PATCH 053/289] fix single-threading failsafe when number of files cannot be estimated --- src/Storages/StorageS3.cpp | 25 +++++++++++++++++++++++-- src/Storages/StorageS3.h | 1 + 2 files changed, 24 insertions(+), 2 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index acef213c1f4..daab457e46b 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -229,6 +229,14 @@ public: return buffer.size(); } + bool hasMore() + { + if (!buffer.size()) + return !(expanded_keys_iter == expanded_keys.end() && is_finished_for_key); + else + return true; + } + ~Impl() { list_objects_pool.wait(); @@ -481,6 +489,11 @@ size_t StorageS3Source::DisclosedGlobIterator::estimatedKeysCount() return pimpl->objectsCount(); } +bool StorageS3Source::DisclosedGlobIterator::hasMore() +{ + return pimpl->hasMore(); +} + class StorageS3Source::KeysIterator::Impl { public: @@ -1243,8 +1256,16 @@ 
void ReadFromStorageS3Step::initializePipeline(QueryPipelineBuilder & pipeline, if (estimated_keys_count > 1) num_streams = std::min(num_streams, estimated_keys_count); else - /// Disclosed glob iterator can underestimate the amount of keys in some cases. We will keep one stream for this particular case. - num_streams = 1; + { + const auto glob_iter = std::dynamic_pointer_cast(iterator_wrapper); + if (!(glob_iter && glob_iter->hasMore())) + { + /// Disclosed glob iterator can underestimate the amount of keys in some cases. We will keep one stream for this particular case. + num_streams = 1; + } + /// Otherwise, 1000 files were already listed, but none of them is actually what we are looking for. + /// We cannot estimate _how many_ there are left, but if there are more files to list, it's faster to do it in many streams. + } const size_t max_threads = context->getSettingsRef().max_threads; const size_t max_parsing_threads = num_streams >= max_threads ? 1 : (max_threads / std::max(num_streams, 1ul)); diff --git a/src/Storages/StorageS3.h b/src/Storages/StorageS3.h index 19cbfaa6f08..8d21f1d8e8e 100644 --- a/src/Storages/StorageS3.h +++ b/src/Storages/StorageS3.h @@ -83,6 +83,7 @@ public: KeyWithInfoPtr next(size_t idx = 0) override; /// NOLINT size_t estimatedKeysCount() override; + bool hasMore(); private: class Impl; From ae17941e63e1f66520ef13616ff0370e83996a4e Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 25 Apr 2024 15:51:06 +0800 Subject: [PATCH 054/289] add docs --- docs/en/interfaces/formats.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index f4b082c57ab..80ca0109f0b 100644 --- a/docs/en/interfaces/formats.md +++ b/docs/en/interfaces/formats.md @@ -75,7 +75,7 @@ The supported formats are: | [ArrowStream](#data-format-arrow-stream) | ✔ | ✔ | | [ORC](#data-format-orc) | ✔ | ✔ | | [One](#data-format-one) | ✔ | ✗ | -| [Npy](#data-format-npy) | ✔ | ✗ | +| [Npy](#data-format-npy) | ✔ | ✔ | | [RowBinary](#rowbinary) | ✔ | ✔ | | [RowBinaryWithNames](#rowbinarywithnamesandtypes) | ✔ | ✔ | | [RowBinaryWithNamesAndTypes](#rowbinarywithnamesandtypes) | ✔ | ✔ | From 5e8bc4402ab4df42d228c0474ee01fbb83c97a71 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 25 Apr 2024 15:52:30 +0800 Subject: [PATCH 055/289] unified NumpyDataTypes --- src/Formats/NumpyDataTypes.h | 50 ++++++++-- .../Formats/Impl/NpyOutputFormat.cpp | 91 ++++++++++++------- src/Processors/Formats/Impl/NpyOutputFormat.h | 15 +-- 3 files changed, 99 insertions(+), 57 deletions(-) diff --git a/src/Formats/NumpyDataTypes.h b/src/Formats/NumpyDataTypes.h index 712797515c9..5cf2ebf5b40 100644 --- a/src/Formats/NumpyDataTypes.h +++ b/src/Formats/NumpyDataTypes.h @@ -1,10 +1,12 @@ #pragma once #include #include +#include namespace ErrorCodes { extern const int BAD_ARGUMENTS; + extern const int NOT_IMPLEMENTED; } enum class NumpyDataTypeIndex @@ -29,9 +31,9 @@ class NumpyDataType public: enum Endianness { - LITTLE, - BIG, - NONE, + LITTLE = '<', + BIG = '>', + NONE = '|', }; NumpyDataTypeIndex type_index; @@ -41,15 +43,18 @@ public: Endianness getEndianness() const { return endianness; } virtual NumpyDataTypeIndex getTypeIndex() const = 0; + virtual size_t getSize() const { throw DB::Exception(DB::ErrorCodes::NOT_IMPLEMENTED, "Function getSize() is not implemented"); } + virtual void setSize(size_t) { throw DB::Exception(DB::ErrorCodes::NOT_IMPLEMENTED, "Function setSize() is not implemented"); } + virtual String 
str() const { throw DB::Exception(DB::ErrorCodes::NOT_IMPLEMENTED, "Function str() is not implemented"); } -private: +protected: Endianness endianness; }; class NumpyDataTypeInt : public NumpyDataType { public: - NumpyDataTypeInt(Endianness endianness, size_t size_, bool is_signed_) : NumpyDataType(endianness), size(size_), is_signed(is_signed_) + NumpyDataTypeInt(Endianness endianness_, size_t size_, bool is_signed_) : NumpyDataType(endianness_), size(size_), is_signed(is_signed_) { switch (size) { @@ -67,6 +72,14 @@ public: return type_index; } bool isSigned() const { return is_signed; } + String str() const override + { + DB::WriteBufferFromOwnString buf; + writeChar(static_cast(endianness), buf); + writeChar(is_signed ? 'i' : 'u', buf); + writeIntText(size, buf); + return buf.str(); + } private: size_t size; @@ -76,7 +89,7 @@ private: class NumpyDataTypeFloat : public NumpyDataType { public: - NumpyDataTypeFloat(Endianness endianness, size_t size_) : NumpyDataType(endianness), size(size_) + NumpyDataTypeFloat(Endianness endianness_, size_t size_) : NumpyDataType(endianness_), size(size_) { switch (size) { @@ -92,6 +105,14 @@ public: { return type_index; } + String str() const override + { + DB::WriteBufferFromOwnString buf; + writeChar(static_cast(endianness), buf); + writeChar('f', buf); + writeIntText(size, buf); + return buf.str(); + } private: size_t size; }; @@ -99,13 +120,22 @@ private: class NumpyDataTypeString : public NumpyDataType { public: - NumpyDataTypeString(Endianness endianness, size_t size_) : NumpyDataType(endianness), size(size_) + NumpyDataTypeString(Endianness endianness_, size_t size_) : NumpyDataType(endianness_), size(size_) { type_index = NumpyDataTypeIndex::String; } NumpyDataTypeIndex getTypeIndex() const override { return type_index; } - size_t getSize() const { return size; } + size_t getSize() const override { return size; } + void setSize(size_t size_) override { size = size_; } + String str() const override + { + DB::WriteBufferFromOwnString buf; + writeChar(static_cast(endianness), buf); + writeChar('S', buf); + writeIntText(size, buf); + return buf.str(); + } private: size_t size; }; @@ -113,13 +143,13 @@ private: class NumpyDataTypeUnicode : public NumpyDataType { public: - NumpyDataTypeUnicode(Endianness endianness, size_t size_) : NumpyDataType(endianness), size(size_) + NumpyDataTypeUnicode(Endianness endianness_, size_t size_) : NumpyDataType(endianness_), size(size_) { type_index = NumpyDataTypeIndex::Unicode; } NumpyDataTypeIndex getTypeIndex() const override { return type_index; } - size_t getSize() const { return size * 4; } + size_t getSize() const override { return size * 4; } private: size_t size; }; diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp index d54fc7e68f2..64272307e9d 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp +++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp @@ -45,16 +45,6 @@ void writeNumpyStrings(const ColumnPtr & column, size_t length, WriteBuffer & bu } -String NpyOutputFormat::NumpyDataType::str() const -{ - WriteBufferFromOwnString dtype; - writeChar(endianness, dtype); - writeChar(type, dtype); - writeIntText(size, dtype); - - return dtype.str(); -} - String NpyOutputFormat::shapeStr() const { WriteBufferFromOwnString shape; @@ -85,20 +75,48 @@ bool NpyOutputFormat::getNumpyDataType(const DataTypePtr & type) { switch (type->getTypeId()) { - case TypeIndex::Int8: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int8)); break; - case 
TypeIndex::Int16: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int16)); break; - case TypeIndex::Int32: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int32)); break; - case TypeIndex::Int64: numpy_data_type = NumpyDataType('<', 'i', sizeof(Int64)); break; - case TypeIndex::UInt8: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt8)); break; - case TypeIndex::UInt16: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt16)); break; - case TypeIndex::UInt32: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt32)); break; - case TypeIndex::UInt64: numpy_data_type = NumpyDataType('<', 'u', sizeof(UInt64)); break; - case TypeIndex::Float32: numpy_data_type = NumpyDataType('<', 'f', sizeof(Float32)); break; - case TypeIndex::Float64: numpy_data_type = NumpyDataType('<', 'f', sizeof(Float64)); break; - case TypeIndex::FixedString: numpy_data_type = NumpyDataType('|', 'S', assert_cast(type.get())->getN()); break; - case TypeIndex::String: numpy_data_type = NumpyDataType('|', 'S', 0); break; - case TypeIndex::Array: return getNumpyDataType(assert_cast(type.get())->getNestedType()); - default: nested_data_type = type; return false; + case TypeIndex::Int8: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(Int8), true); + break; + case TypeIndex::Int16: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(Int16), true); + break; + case TypeIndex::Int32: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(Int32), true); + break; + case TypeIndex::Int64: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(Int64), true); + break; + case TypeIndex::UInt8: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(UInt8), false); + break; + case TypeIndex::UInt16: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(UInt16), false); + break; + case TypeIndex::UInt32: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(UInt32), false); + break; + case TypeIndex::UInt64: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(UInt64), false); + break; + case TypeIndex::Float32: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(Float32)); + break; + case TypeIndex::Float64: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::LITTLE, sizeof(Float64)); + break; + case TypeIndex::FixedString: + numpy_data_type = std::make_shared( + NumpyDataType::Endianness::NONE, assert_cast(type.get())->getN()); + break; + case TypeIndex::String: + numpy_data_type = std::make_shared(NumpyDataType::Endianness::NONE, 0); + break; + case TypeIndex::Array: + return getNumpyDataType(assert_cast(type.get())->getNestedType()); + default: + nested_data_type = type; + return false; } nested_data_type = type; @@ -117,6 +135,9 @@ void NpyOutputFormat::consume(Chunk chunk) initShape(column); is_initialized = true; } + // ColumnPtr checkShape, if nullptr? 
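As a side note on the descriptor strings the str() overrides above produce: a NumPy 'descr' is one endianness character ('<', '>' or '|'), one kind character ('i', 'u', 'f' or 'S'), and the element size in bytes. A free-standing sketch of the same encoding, with hypothetical names rather than the classes from this patch:

    #include <cstddef>
    #include <string>

    enum class Endianness : char { Little = '<', Big = '>', None = '|' };

    // Build a NumPy dtype descriptor such as "<i8", "<f4" or "|S16".
    std::string numpyDescr(Endianness endianness, char kind, size_t size)
    {
        std::string descr;
        descr += static_cast<char>(endianness);
        descr += kind;
        descr += std::to_string(size);
        return descr;
    }

    // Usage: numpyDescr(Endianness::Little, 'i', 8) yields "<i8",
    //        numpyDescr(Endianness::None, 'S', 16) yields "|S16".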
+ // updateSizeIfTypeString + // columns.push_back() if (!checkShape(column)) { @@ -130,13 +151,9 @@ void NpyOutputFormat::initShape(const ColumnPtr & column) { auto type = data_type; ColumnPtr nested_column = column; - while (type->getTypeId() == TypeIndex::Array) + while (const auto * array_column = typeid_cast(nested_column.get())) { - const auto * array_column = assert_cast(nested_column.get()); - numpy_shape.push_back(array_column->getOffsets()[0]); - - type = assert_cast(type.get())->getNestedType(); nested_column = array_column->getDataPtr(); } } @@ -166,7 +183,8 @@ bool NpyOutputFormat::checkShape(const ColumnPtr & column) for (size_t i = 0; i < string_offsets.size(); ++i) { size_t string_length = static_cast(string_offsets[i] - 1 - string_offsets[i - 1]); - numpy_data_type.size = numpy_data_type.size > string_length ? numpy_data_type.size : string_length; + if (numpy_data_type->getSize() < string_length) + numpy_data_type->setSize(string_length); } } @@ -185,7 +203,7 @@ void NpyOutputFormat::finalizeImpl() void NpyOutputFormat::writeHeader() { - String dict = "{'descr':'" + numpy_data_type.str() + "','fortran_order':False,'shape':(" + shapeStr() + "),}"; + String dict = "{'descr':'" + numpy_data_type->str() + "','fortran_order':False,'shape':(" + shapeStr() + "),}"; String padding = "\n"; /// completes the length of the header, which is divisible by 64. @@ -221,9 +239,14 @@ void NpyOutputFormat::writeColumns() case TypeIndex::UInt64: writeNumpyNumbers(column, out); break; case TypeIndex::Float32: writeNumpyNumbers(column, out); break; case TypeIndex::Float64: writeNumpyNumbers(column, out); break; - case TypeIndex::FixedString: writeNumpyStrings(column, numpy_data_type.size, out); break; - case TypeIndex::String: writeNumpyStrings(column, numpy_data_type.size, out); break; - default: break; + case TypeIndex::FixedString: + writeNumpyStrings(column, numpy_data_type->getSize(), out); + break; + case TypeIndex::String: + writeNumpyStrings(column, numpy_data_type->getSize(), out); + break; + default: + break; } } } diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.h b/src/Processors/Formats/Impl/NpyOutputFormat.h index 83fad657b2e..6859cf10e69 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.h +++ b/src/Processors/Formats/Impl/NpyOutputFormat.h @@ -5,6 +5,7 @@ #include #include #include +#include #include #include @@ -28,18 +29,6 @@ public: String getContentType() const override { return "application/octet-stream"; } private: - struct NumpyDataType - { - char endianness; - char type; - size_t size; - - NumpyDataType() = default; - NumpyDataType(char endianness_, char type_, size_t size_) - : endianness(endianness_), type(type_), size(size_) {} - String str() const; - }; - String shapeStr() const; bool getNumpyDataType(const DataTypePtr & type); @@ -57,7 +46,7 @@ private: DataTypePtr data_type; DataTypePtr nested_data_type; - NumpyDataType numpy_data_type; + std::shared_ptr numpy_data_type; UInt64 num_rows = 0; std::vector numpy_shape; Columns columns; From 686ea6af9c3512c7b07345cabc785bb975311162 Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Thu, 25 Apr 2024 09:06:49 +0000 Subject: [PATCH 056/289] fix style and logic of estimation --- src/Storages/StorageS3.cpp | 20 +++++++++++--------- 1 file changed, 11 insertions(+), 9 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 6ba41d21766..bdfd2b8b453 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -231,7 +231,7 @@ public: bool hasMore() { - if 
(!buffer.size())
+        if (buffer.empty())
             return !(expanded_keys_iter == expanded_keys.end() && is_finished_for_key);
         else
             return true;
@@ -1286,19 +1286,21 @@ void ReadFromStorageS3Step::initializePipeline(QueryPipelineBuilder & pipeline,
     createIterator(nullptr);
     size_t estimated_keys_count = iterator_wrapper->estimatedKeysCount();
-    if (estimated_keys_count > 1)
-        num_streams = std::min(num_streams, estimated_keys_count);
-    else
+    const auto glob_iter = std::dynamic_pointer_cast<StorageS3Source::DisclosedGlobIterator>(iterator_wrapper);
+
+    if (!(glob_iter && glob_iter->hasMore()))
     {
-        const auto glob_iter = std::dynamic_pointer_cast<StorageS3Source::DisclosedGlobIterator>(iterator_wrapper);
-        if (!(glob_iter && glob_iter->hasMore()))
+        if (estimated_keys_count > 1)
+            num_streams = std::min(num_streams, estimated_keys_count);
+        else
         {
-            /// Disclosed glob iterator can underestimate the amount of keys in some cases. We will keep one stream for this particular case.
+            /// The amount of keys (zero) was probably underestimated. We will keep one stream for this particular case.
             num_streams = 1;
         }
-        /// Otherwise, 1000 files were already listed, but none of them is actually what we are looking for.
-        /// We cannot estimate _how many_ there are left, but if there are more files to list, it's faster to do it in many streams.
     }
+    /// Otherwise, 1000 files were listed, but we cannot make any estimation of _how many_ there are (because we list the bucket lazily);
+    /// if there are more objects in the bucket, limiting the number of streams is the last thing we may want to do,
+    /// as it would lead to serious (up to several times) reading performance degradation.
 
     const size_t max_threads = context->getSettingsRef().max_threads;
     const size_t max_parsing_threads = num_streams >= max_threads ? 1 : (max_threads / std::max(num_streams, 1ul));

From d3d7d3575db1f0d76f4a910c1bc30faf911cf839 Mon Sep 17 00:00:00 2001
From: HowePa <2873679104@qq.com>
Date: Thu, 25 Apr 2024 17:16:11 +0800
Subject: [PATCH 057/289] fix empty array & refactor

---
 .../Formats/Impl/NpyOutputFormat.cpp          | 45 +++++++++---------
 src/Processors/Formats/Impl/NpyOutputFormat.h |  3 +-
 .../02895_npy_output_format.reference         | Bin 626 -> 1010 bytes
 .../0_stateless/02895_npy_output_format.sh    |  6 ++-
 4 files changed, 28 insertions(+), 26 deletions(-)

diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
index 64272307e9d..f031b776ff7 100644
--- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
@@ -135,51 +135,53 @@ void NpyOutputFormat::consume(Chunk chunk)
             initShape(column);
             is_initialized = true;
         }
-        // ColumnPtr checkShape, if nullptr?
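Before moving on from the StorageS3 hunk above, its decision rule is worth spelling out: S3 listing is lazy and paginated (up to 1000 keys per page), so while hasMore() reports unread pages the total key count is unknowable and the stream count should be left alone; only a finished listing justifies capping the parallel readers. A reduced sketch of that rule, with a hypothetical stand-in for the iterator:

    #include <algorithm>
    #include <cstddef>

    // Hypothetical stand-in for the glob iterator: how many keys were listed
    // so far, and whether the paginated listing may still return more.
    struct ListingState
    {
        size_t listed_keys = 0;
        bool may_have_more = false;   // true while further ListObjects pages remain
    };

    size_t chooseNumStreams(size_t requested_streams, const ListingState & state)
    {
        if (state.may_have_more)
            return requested_streams;           // total unknown: do not throttle readers
        if (state.listed_keys > 1)
            return std::min(requested_streams, state.listed_keys);
        return 1;                               // listing finished with zero or one key
    }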
- // updateSizeIfTypeString - // columns.push_back() - if (!checkShape(column)) - { - invalid_shape = true; - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ClickHouse doesn't support object types, cannot format ragged nested sequences (which is a list of arrays with different shapes)"); - } + ColumnPtr nested_column = column; + checkShape(nested_column); + updateSizeIfTypeString(nested_column); + columns.push_back(nested_column); } } void NpyOutputFormat::initShape(const ColumnPtr & column) { - auto type = data_type; ColumnPtr nested_column = column; while (const auto * array_column = typeid_cast(nested_column.get())) { - numpy_shape.push_back(array_column->getOffsets()[0]); + auto dim = array_column->getOffsets()[0]; + invalid_shape = dim == 0; + numpy_shape.push_back(dim); nested_column = array_column->getDataPtr(); } + + if (invalid_shape) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Shape ({}) is an invalid shape, as dimension size cannot be 0", shapeStr()); } -bool NpyOutputFormat::checkShape(const ColumnPtr & column) +void NpyOutputFormat::checkShape(ColumnPtr & column) { - auto type = data_type; - ColumnPtr nested_column = column; int dim = 0; - while (type->getTypeId() == TypeIndex::Array) + while (const auto * array_column = typeid_cast(column.get())) { - const auto * array_column = assert_cast(nested_column.get()); const auto & array_offset = array_column->getOffsets(); for (size_t i = 1; i < array_offset.size(); ++i) if (array_offset[i] - array_offset[i - 1] != numpy_shape[dim]) - return false; + { + invalid_shape = true; + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ClickHouse doesn't support object types, cannot format ragged nested sequences (which is a list of arrays with different shapes)"); + } - type = assert_cast(type.get())->getNestedType(); - nested_column = array_column->getDataPtr(); + column = array_column->getDataPtr(); dim += 1; } +} - if (type->getTypeId() == TypeIndex::String) +void NpyOutputFormat::updateSizeIfTypeString(const ColumnPtr & column) +{ + if (nested_data_type->getTypeId() == TypeIndex::String) { - const auto & string_offsets = assert_cast(nested_column.get())->getOffsets(); + const auto & string_offsets = assert_cast(column.get())->getOffsets(); for (size_t i = 0; i < string_offsets.size(); ++i) { size_t string_length = static_cast(string_offsets[i] - 1 - string_offsets[i - 1]); @@ -187,9 +189,6 @@ bool NpyOutputFormat::checkShape(const ColumnPtr & column) numpy_data_type->setSize(string_length); } } - - columns.push_back(nested_column); - return true; } void NpyOutputFormat::finalizeImpl() diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.h b/src/Processors/Formats/Impl/NpyOutputFormat.h index 6859cf10e69..5dd6552ac0c 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.h +++ b/src/Processors/Formats/Impl/NpyOutputFormat.h @@ -35,7 +35,8 @@ private: void consume(Chunk) override; void initShape(const ColumnPtr & column); - bool checkShape(const ColumnPtr & column); + void checkShape(ColumnPtr & column); + void updateSizeIfTypeString(const ColumnPtr & column); void finalizeImpl() override; void writeHeader(); diff --git a/tests/queries/0_stateless/02895_npy_output_format.reference b/tests/queries/0_stateless/02895_npy_output_format.reference index b599f1dceeaabbd60cb66d02ab02a5d1a30c97f2..590c0581ac112679dea10b0c431dd1b69fae4ab6 100644 GIT binary patch literal 1010 zcmdNj*ax)~q=R6{@_sHT8KP>pfR$xlR61QtS765RbshDz{GyVg#Ju?YqLfsis9R!AajK4baYkZ6s=Aeiv5pZCYUmJMli1i;F49DS$rz~7Ko4jLP$xc~dSX%%Fk+LE ylGTAa)RU8wfxHwTPzP(JL>iJA96?z`1DOORbxlo8 Date: 
Thu, 25 Apr 2024 17:17:35 +0800 Subject: [PATCH 058/289] unified array travel Co-authored-by: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> --- src/Processors/Formats/Impl/NpyOutputFormat.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp index d54fc7e68f2..64bc916da51 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp +++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp @@ -151,7 +151,7 @@ bool NpyOutputFormat::checkShape(const ColumnPtr & column) const auto * array_column = assert_cast(nested_column.get()); const auto & array_offset = array_column->getOffsets(); - for (size_t i = 1; i < array_offset.size(); ++i) + for (size_t i = 0; i < array_offset.size(); ++i) if (array_offset[i] - array_offset[i - 1] != numpy_shape[dim]) return false; From d85f6ae35d64cd8f40a5cfb05aa53d60af48955e Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 25 Apr 2024 17:31:18 +0800 Subject: [PATCH 059/289] reset test --- .../Formats/Impl/NpyOutputFormat.cpp | 2 +- .../02895_npy_output_format.reference | Bin 1010 -> 626 bytes 2 files changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp index f67c91540e4..b3d5042aa79 100644 --- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp +++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp @@ -155,7 +155,7 @@ void NpyOutputFormat::initShape(const ColumnPtr & column) } if (invalid_shape) - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Shape ({}) is an invalid shape, as dimension size cannot be 0", shapeStr()); + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Shape ({}) is invalid, as dimension size cannot be 0", shapeStr()); } void NpyOutputFormat::checkShape(ColumnPtr & column) diff --git a/tests/queries/0_stateless/02895_npy_output_format.reference b/tests/queries/0_stateless/02895_npy_output_format.reference index 590c0581ac112679dea10b0c431dd1b69fae4ab6..b599f1dceeaabbd60cb66d02ab02a5d1a30c97f2 100644 GIT binary patch delta 16 Ycmeyw{)uISGvnm*ax)~q=R6{@_sHT8KP>pfR$xlR61QtS765RbshDz{GyVg#Ju?YqLfsis9R!AajK4baYkZ6s=Aeiv5pZCYUmJMli1i;F49DS$rz~7Ko4jLP$xc~dSX%%Fk+LE ylGTAa)RU8wfxHwTPzP(JL>iJA96?z`1DOORbxlo8 Date: Wed, 24 Apr 2024 11:04:56 +0200 Subject: [PATCH 060/289] dx: Enhance error message when non-deterministic function is used with Replicated source --- src/Interpreters/MutationsInterpreter.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Interpreters/MutationsInterpreter.cpp b/src/Interpreters/MutationsInterpreter.cpp index 35fd549559b..667a3e2e7a6 100644 --- a/src/Interpreters/MutationsInterpreter.cpp +++ b/src/Interpreters/MutationsInterpreter.cpp @@ -1313,7 +1313,7 @@ void MutationsInterpreter::validate() if (nondeterministic_func_data.nondeterministic_function_name) throw Exception(ErrorCodes::BAD_ARGUMENTS, - "ALTER UPDATE/ALTER DELETE statements must use only deterministic functions. " + "The source storage is replicated so ALTER UPDATE/ALTER DELETE statements must use only deterministic functions. 
" "Function '{}' is non-deterministic", *nondeterministic_func_data.nondeterministic_function_name); } } From b13c7d004c6f533a1931eb8ac5c529ca82914cd9 Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Thu, 25 Apr 2024 14:51:44 +0000 Subject: [PATCH 061/289] fix tidy --- src/Storages/StorageS3.cpp | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index bdfd2b8b453..cb5734cfe0c 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -278,7 +278,6 @@ private: filter_dag = VirtualColumnUtils::createPathAndFileFilterDAG(predicate, virtual_columns); fillInternalBufferAssumeLocked(); - return; } KeyWithInfoPtr nextAssumeLocked() From 34dd0a229f04f3b7f8b3181ced3be6430c0f1d2c Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Thu, 25 Apr 2024 15:46:29 +0000 Subject: [PATCH 062/289] Another one case of aliases with group_by_use_null --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 87 ++++++++++++------- ...up_by_use_nulls_analyzer_crashes.reference | 10 +++ ...23_group_by_use_nulls_analyzer_crashes.sql | 11 +++ 3 files changed, 76 insertions(+), 32 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index aedf860f5be..13ce3d7f0e2 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -474,7 +474,7 @@ struct TableExpressionData class ExpressionsStack { public: - void pushNode(const QueryTreeNodePtr & node) + void push(const QueryTreeNodePtr & node) { if (node->hasAlias()) { @@ -491,7 +491,7 @@ public: expressions.emplace_back(node); } - void popNode() + void pop() { const auto & top_expression = expressions.back(); const auto & top_expression_alias = top_expression->getAlias(); @@ -729,6 +729,8 @@ struct IdentifierResolveScope join_use_nulls = context->getSettingsRef().join_use_nulls; else if (parent_scope) join_use_nulls = parent_scope->join_use_nulls; + + alias_name_to_expression_node = &alias_name_to_expression_node_before_group_by; } QueryTreeNodePtr scope_node; @@ -744,7 +746,10 @@ struct IdentifierResolveScope std::unordered_map expression_argument_name_to_node; /// Alias name to query expression node - std::unordered_map alias_name_to_expression_node; + std::unordered_map alias_name_to_expression_node_before_group_by; + std::unordered_map alias_name_to_expression_node_after_group_by; + + std::unordered_map * alias_name_to_expression_node = nullptr; /// Alias name to lambda node std::unordered_map alias_name_to_lambda_node; @@ -877,6 +882,22 @@ struct IdentifierResolveScope return it->second; } + void pushExpressionNode(const QueryTreeNodePtr & node) + { + bool had_aggregate_function = expressions_in_resolve_process_stack.hasAggregateFunction(); + expressions_in_resolve_process_stack.push(node); + if (group_by_use_nulls && had_aggregate_function != expressions_in_resolve_process_stack.hasAggregateFunction()) + alias_name_to_expression_node = &alias_name_to_expression_node_before_group_by; + } + + void popExpressionNode() + { + bool had_aggregate_function = expressions_in_resolve_process_stack.hasAggregateFunction(); + expressions_in_resolve_process_stack.pop(); + if (group_by_use_nulls && had_aggregate_function != expressions_in_resolve_process_stack.hasAggregateFunction()) + alias_name_to_expression_node = &alias_name_to_expression_node_after_group_by; + } + /// Dump identifier resolve scope [[maybe_unused]] void dump(WriteBuffer & buffer) const { @@ -893,8 +914,8 @@ struct IdentifierResolveScope for (const 
auto & [alias_name, node] : expression_argument_name_to_node) buffer << "Alias name " << alias_name << " node " << node->formatASTForErrorMessage() << '\n'; - buffer << "Alias name to expression node table size " << alias_name_to_expression_node.size() << '\n'; - for (const auto & [alias_name, node] : alias_name_to_expression_node) + buffer << "Alias name to expression node table size " << alias_name_to_expression_node->size() << '\n'; + for (const auto & [alias_name, node] : *alias_name_to_expression_node) buffer << "Alias name " << alias_name << " expression node " << node->dumpTree() << '\n'; buffer << "Alias name to function node table size " << alias_name_to_lambda_node.size() << '\n'; @@ -1022,7 +1043,7 @@ private: if (is_lambda_node) { - if (scope.alias_name_to_expression_node.contains(alias)) + if (scope.alias_name_to_expression_node->contains(alias)) scope.nodes_with_duplicated_aliases.insert(node); auto [_, inserted] = scope.alias_name_to_lambda_node.insert(std::make_pair(alias, node)); @@ -1035,7 +1056,7 @@ private: if (scope.alias_name_to_lambda_node.contains(alias)) scope.nodes_with_duplicated_aliases.insert(node); - auto [_, inserted] = scope.alias_name_to_expression_node.insert(std::make_pair(alias, node)); + auto [_, inserted] = scope.alias_name_to_expression_node->insert(std::make_pair(alias, node)); if (!inserted) scope.nodes_with_duplicated_aliases.insert(node); @@ -1837,7 +1858,7 @@ void QueryAnalyzer::collectScopeValidIdentifiersForTypoCorrection( if (allow_expression_identifiers) { - for (const auto & [name, expression] : scope.alias_name_to_expression_node) + for (const auto & [name, expression] : *scope.alias_name_to_expression_node) { assert(expression); auto expression_identifier = Identifier(name); @@ -1867,7 +1888,7 @@ void QueryAnalyzer::collectScopeValidIdentifiersForTypoCorrection( { if (allow_function_identifiers) { - for (const auto & [name, _] : scope.alias_name_to_expression_node) + for (const auto & [name, _] : *scope.alias_name_to_expression_node) valid_identifiers_result.insert(Identifier(name)); } @@ -2767,7 +2788,7 @@ bool QueryAnalyzer::tryBindIdentifierToAliases(const IdentifierLookup & identifi auto get_alias_name_to_node_map = [&]() -> const std::unordered_map & { if (identifier_lookup.isExpressionLookup()) - return scope.alias_name_to_expression_node; + return *scope.alias_name_to_expression_node; else if (identifier_lookup.isFunctionLookup()) return scope.alias_name_to_lambda_node; @@ -2829,7 +2850,7 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromAliases(const Identifier auto get_alias_name_to_node_map = [&]() -> std::unordered_map & { if (identifier_lookup.isExpressionLookup()) - return scope.alias_name_to_expression_node; + return *scope.alias_name_to_expression_node; else if (identifier_lookup.isFunctionLookup()) return scope.alias_name_to_lambda_node; @@ -2867,7 +2888,7 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromAliases(const Identifier /// Resolve expression if necessary if (node_type == QueryTreeNodeType::IDENTIFIER) { - scope.expressions_in_resolve_process_stack.pushNode(it->second); + scope.pushExpressionNode(it->second); auto & alias_identifier_node = it->second->as(); auto identifier = alias_identifier_node.getIdentifier(); @@ -2898,9 +2919,9 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromAliases(const Identifier if (identifier_lookup.isExpressionLookup()) scope.alias_name_to_lambda_node.erase(identifier_bind_part); else if (identifier_lookup.isFunctionLookup()) - 
scope.alias_name_to_expression_node.erase(identifier_bind_part); + scope.alias_name_to_expression_node->erase(identifier_bind_part); - scope.expressions_in_resolve_process_stack.popNode(); + scope.popExpressionNode(); } else if (node_type == QueryTreeNodeType::FUNCTION) { @@ -5195,7 +5216,7 @@ ProjectionNames QueryAnalyzer::resolveLambda(const QueryTreeNodePtr & lambda_nod auto & lambda_argument_node_typed = lambda_argument_node->as(); const auto & lambda_argument_name = lambda_argument_node_typed.getIdentifier().getFullName(); - bool has_expression_node = scope.alias_name_to_expression_node.contains(lambda_argument_name); + bool has_expression_node = scope.alias_name_to_expression_node->contains(lambda_argument_name); bool has_alias_node = scope.alias_name_to_lambda_node.contains(lambda_argument_name); if (has_expression_node || has_alias_node) @@ -6200,8 +6221,8 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id * * To resolve b we need to resolve a. */ - auto it = scope.alias_name_to_expression_node.find(node_alias); - if (it != scope.alias_name_to_expression_node.end()) + auto it = scope.alias_name_to_expression_node->find(node_alias); + if (it != scope.alias_name_to_expression_node->end()) node = it->second; if (allow_lambda_expression) @@ -6212,7 +6233,7 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id } } - scope.expressions_in_resolve_process_stack.pushNode(node); + scope.pushExpressionNode(node); auto node_type = node->getNodeType(); @@ -6241,7 +6262,7 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id resolved_identifier_node = tryResolveIdentifier({unresolved_identifier, IdentifierLookupContext::FUNCTION}, scope).resolved_identifier; if (resolved_identifier_node && !node_alias.empty()) - scope.alias_name_to_expression_node.erase(node_alias); + scope.alias_name_to_expression_node->erase(node_alias); } if (!resolved_identifier_node && allow_table_expression) @@ -6472,8 +6493,8 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id */ if (!node_alias.empty() && use_alias_table && !scope.group_by_use_nulls) { - auto it = scope.alias_name_to_expression_node.find(node_alias); - if (it != scope.alias_name_to_expression_node.end()) + auto it = scope.alias_name_to_expression_node->find(node_alias); + if (it != scope.alias_name_to_expression_node->end()) it->second = node; if (allow_lambda_expression) @@ -6486,7 +6507,7 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id resolved_expressions.emplace(node, result_projection_names); - scope.expressions_in_resolve_process_stack.popNode(); + scope.popExpressionNode(); bool expression_was_root = scope.expressions_in_resolve_process_stack.empty(); if (expression_was_root) scope.non_cached_identifier_lookups_during_expression_resolve.clear(); @@ -6830,11 +6851,11 @@ void QueryAnalyzer::initializeQueryJoinTreeNode(QueryTreeNodePtr & join_tree_nod */ resolve_settings.allow_to_resolve_subquery_during_identifier_resolution = false; - scope.expressions_in_resolve_process_stack.pushNode(current_join_tree_node); + scope.pushExpressionNode(current_join_tree_node); auto table_identifier_resolve_result = tryResolveIdentifier(table_identifier_lookup, scope, resolve_settings); - scope.expressions_in_resolve_process_stack.popNode(); + scope.popExpressionNode(); bool expression_was_root = scope.expressions_in_resolve_process_stack.empty(); if (expression_was_root) 
scope.non_cached_identifier_lookups_during_expression_resolve.clear(); @@ -7418,7 +7439,7 @@ void QueryAnalyzer::resolveArrayJoin(QueryTreeNodePtr & array_join_node, Identif for (auto & array_join_expression : array_join_nodes) { auto array_join_expression_alias = array_join_expression->getAlias(); - if (!array_join_expression_alias.empty() && scope.alias_name_to_expression_node.contains(array_join_expression_alias)) + if (!array_join_expression_alias.empty() && scope.alias_name_to_expression_node->contains(array_join_expression_alias)) throw Exception(ErrorCodes::MULTIPLE_EXPRESSIONS_FOR_ALIAS, "ARRAY JOIN expression {} with duplicate alias {}. In scope {}", array_join_expression->formatASTForErrorMessage(), @@ -7512,8 +7533,8 @@ void QueryAnalyzer::resolveArrayJoin(QueryTreeNodePtr & array_join_node, Identif array_join_nodes = std::move(array_join_column_expressions); for (auto & array_join_column_expression : array_join_nodes) { - auto it = scope.alias_name_to_expression_node.find(array_join_column_expression->getAlias()); - if (it != scope.alias_name_to_expression_node.end()) + auto it = scope.alias_name_to_expression_node->find(array_join_column_expression->getAlias()); + if (it != scope.alias_name_to_expression_node->end()) { auto & array_join_column_expression_typed = array_join_column_expression->as(); auto array_join_column = std::make_shared(array_join_column_expression_typed.getColumn(), @@ -8037,8 +8058,10 @@ void QueryAnalyzer::resolveQuery(const QueryTreeNodePtr & query_node, Identifier /// Clone is needed cause aliases share subtrees. /// If not clone, the same (shared) subtree could be resolved again with different (Nullable) type /// See 03023_group_by_use_nulls_analyzer_crashes - for (auto & [_, node] : scope.alias_name_to_expression_node) - node = node->clone(); + for (auto & [key, node] : scope.alias_name_to_expression_node_before_group_by) + scope.alias_name_to_expression_node_after_group_by[key] = node->clone(); + + scope.alias_name_to_expression_node = &scope.alias_name_to_expression_node_after_group_by; } if (query_node_typed.hasHaving()) @@ -8115,8 +8138,8 @@ void QueryAnalyzer::resolveQuery(const QueryTreeNodePtr & query_node, Identifier bool has_node_in_alias_table = false; - auto it = scope.alias_name_to_expression_node.find(node_alias); - if (it != scope.alias_name_to_expression_node.end()) + auto it = scope.alias_name_to_expression_node->find(node_alias); + if (it != scope.alias_name_to_expression_node->end()) { has_node_in_alias_table = true; @@ -8175,7 +8198,7 @@ void QueryAnalyzer::resolveQuery(const QueryTreeNodePtr & query_node, Identifier /// Remove aliases from expression and lambda nodes - for (auto & [_, node] : scope.alias_name_to_expression_node) + for (auto & [_, node] : *scope.alias_name_to_expression_node) node->removeAlias(); for (auto & [_, node] : scope.alias_name_to_lambda_node) diff --git a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference index e2682487229..0eb9d94e85a 100644 --- a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference +++ b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference @@ -76,3 +76,13 @@ a a \N 2 \N 4 \N \N +0 0 nan +2 4 nan +1 2 nan +2 \N nan +0 \N nan +1 \N nan +\N 2 nan +\N 0 nan +\N 4 nan +\N \N nan diff --git a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql 
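To restate the mechanism this analyzer patch builds: with group_by_use_nulls the GROUP BY keys become Nullable after aggregation, so the same alias must resolve to the original node inside an aggregate function's arguments but to the Nullable post-GROUP-BY clone everywhere else; hence the two alias maps and the pointer that flips when the resolve stack gains or loses an aggregate function. A toy model of that bookkeeping, with stand-in types rather than the analyzer's:

    #include <memory>
    #include <string>
    #include <unordered_map>
    #include <vector>

    struct Node { std::string name; bool is_aggregate = false; };
    using AliasMap = std::unordered_map<std::string, std::shared_ptr<Node>>;

    // Aliases resolve to pre-GROUP-BY nodes inside aggregate arguments and to
    // post-GROUP-BY (Nullable) clones outside them; `active` selects the map.
    struct AliasScope
    {
        AliasMap before_group_by;
        AliasMap after_group_by;
        AliasMap * active = &before_group_by;
        std::vector<std::shared_ptr<Node>> resolve_stack;
        size_t aggregates_on_stack = 0;

        void push(const std::shared_ptr<Node> & node)
        {
            bool had_aggregate = aggregates_on_stack > 0;
            resolve_stack.push_back(node);
            aggregates_on_stack += node->is_aggregate ? 1 : 0;
            if (!had_aggregate && aggregates_on_stack > 0)
                active = &before_group_by;   // entered an aggregate's arguments
        }

        void pop()
        {
            bool had_aggregate = aggregates_on_stack > 0;
            aggregates_on_stack -= resolve_stack.back()->is_aggregate ? 1 : 0;
            resolve_stack.pop_back();
            if (had_aggregate && aggregates_on_stack == 0)
                active = &after_group_by;    // left the last aggregate's subtree
        }
    };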
index f2d4ac8acee..7311ce54e39 100644 --- a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql +++ b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql @@ -32,3 +32,14 @@ SELECT a, b FROM numbers(3) GROUP BY number as a, (number + number) as b WITH CUBE ORDER BY a, b; + +SELECT + a, + b, + cramersVBiasCorrected(a, b) +FROM numbers(3) +GROUP BY + number AS a, + number + number AS b + WITH CUBE +SETTINGS group_by_use_nulls = 1; From e09530ab755964b6da12718279ef345bf2800d43 Mon Sep 17 00:00:00 2001 From: Vitaly Baranov Date: Fri, 8 Dec 2023 16:51:35 +0100 Subject: [PATCH 063/289] Fix making backup when multiple shards are used. --- src/Backups/BackupCoordinationLocal.cpp | 24 ++++---- src/Backups/BackupCoordinationLocal.h | 12 ++-- src/Backups/BackupCoordinationRemote.cpp | 48 ++++++++-------- src/Backups/BackupCoordinationRemote.h | 12 ++-- .../BackupCoordinationReplicatedTables.cpp | 24 ++++---- .../BackupCoordinationReplicatedTables.h | 14 ++--- src/Backups/BackupEntriesCollector.cpp | 10 ++-- src/Backups/BackupEntriesCollector.h | 2 +- src/Backups/BackupUtils.cpp | 2 +- src/Backups/DDLAdjustingForBackupVisitor.cpp | 10 +--- src/Backups/DDLAdjustingForBackupVisitor.h | 5 +- src/Backups/IBackupCoordination.h | 12 ++-- src/Storages/StorageReplicatedMergeTree.cpp | 56 +++++-------------- src/Storages/StorageReplicatedMergeTree.h | 7 +-- 14 files changed, 100 insertions(+), 138 deletions(-) diff --git a/src/Backups/BackupCoordinationLocal.cpp b/src/Backups/BackupCoordinationLocal.cpp index 9964de2ad6e..efdc18cc29c 100644 --- a/src/Backups/BackupCoordinationLocal.cpp +++ b/src/Backups/BackupCoordinationLocal.cpp @@ -33,42 +33,42 @@ Strings BackupCoordinationLocal::waitForStage(const String &, std::chrono::milli return {}; } -void BackupCoordinationLocal::addReplicatedPartNames(const String & table_shared_id, const String & table_name_for_logs, const String & replica_name, const std::vector & part_names_and_checksums) +void BackupCoordinationLocal::addReplicatedPartNames(const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & part_names_and_checksums) { std::lock_guard lock{replicated_tables_mutex}; - replicated_tables.addPartNames({table_shared_id, table_name_for_logs, replica_name, part_names_and_checksums}); + replicated_tables.addPartNames({table_zk_path, table_name_for_logs, replica_name, part_names_and_checksums}); } -Strings BackupCoordinationLocal::getReplicatedPartNames(const String & table_shared_id, const String & replica_name) const +Strings BackupCoordinationLocal::getReplicatedPartNames(const String & table_zk_path, const String & replica_name) const { std::lock_guard lock{replicated_tables_mutex}; - return replicated_tables.getPartNames(table_shared_id, replica_name); + return replicated_tables.getPartNames(table_zk_path, replica_name); } -void BackupCoordinationLocal::addReplicatedMutations(const String & table_shared_id, const String & table_name_for_logs, const String & replica_name, const std::vector & mutations) +void BackupCoordinationLocal::addReplicatedMutations(const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & mutations) { std::lock_guard lock{replicated_tables_mutex}; - replicated_tables.addMutations({table_shared_id, table_name_for_logs, replica_name, mutations}); + replicated_tables.addMutations({table_zk_path, table_name_for_logs, replica_name, mutations}); } -std::vector 
BackupCoordinationLocal::getReplicatedMutations(const String & table_shared_id, const String & replica_name) const +std::vector BackupCoordinationLocal::getReplicatedMutations(const String & table_zk_path, const String & replica_name) const { std::lock_guard lock{replicated_tables_mutex}; - return replicated_tables.getMutations(table_shared_id, replica_name); + return replicated_tables.getMutations(table_zk_path, replica_name); } -void BackupCoordinationLocal::addReplicatedDataPath(const String & table_shared_id, const String & data_path) +void BackupCoordinationLocal::addReplicatedDataPath(const String & table_zk_path, const String & data_path) { std::lock_guard lock{replicated_tables_mutex}; - replicated_tables.addDataPath({table_shared_id, data_path}); + replicated_tables.addDataPath({table_zk_path, data_path}); } -Strings BackupCoordinationLocal::getReplicatedDataPaths(const String & table_shared_id) const +Strings BackupCoordinationLocal::getReplicatedDataPaths(const String & table_zk_path) const { std::lock_guard lock{replicated_tables_mutex}; - return replicated_tables.getDataPaths(table_shared_id); + return replicated_tables.getDataPaths(table_zk_path); } diff --git a/src/Backups/BackupCoordinationLocal.h b/src/Backups/BackupCoordinationLocal.h index e0aa5dc67a4..a7f15c79649 100644 --- a/src/Backups/BackupCoordinationLocal.h +++ b/src/Backups/BackupCoordinationLocal.h @@ -29,16 +29,16 @@ public: Strings waitForStage(const String & stage_to_wait) override; Strings waitForStage(const String & stage_to_wait, std::chrono::milliseconds timeout) override; - void addReplicatedPartNames(const String & table_shared_id, const String & table_name_for_logs, const String & replica_name, + void addReplicatedPartNames(const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & part_names_and_checksums) override; - Strings getReplicatedPartNames(const String & table_shared_id, const String & replica_name) const override; + Strings getReplicatedPartNames(const String & table_zk_path, const String & replica_name) const override; - void addReplicatedMutations(const String & table_shared_id, const String & table_name_for_logs, const String & replica_name, + void addReplicatedMutations(const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & mutations) override; - std::vector getReplicatedMutations(const String & table_shared_id, const String & replica_name) const override; + std::vector getReplicatedMutations(const String & table_zk_path, const String & replica_name) const override; - void addReplicatedDataPath(const String & table_shared_id, const String & data_path) override; - Strings getReplicatedDataPaths(const String & table_shared_id) const override; + void addReplicatedDataPath(const String & table_zk_path, const String & data_path) override; + Strings getReplicatedDataPaths(const String & table_zk_path) const override; void addReplicatedAccessFilePath(const String & access_zk_path, AccessEntityType access_entity_type, const String & file_path) override; Strings getReplicatedAccessFilePaths(const String & access_zk_path, AccessEntityType access_entity_type) const override; diff --git a/src/Backups/BackupCoordinationRemote.cpp b/src/Backups/BackupCoordinationRemote.cpp index 455f45a7a77..f353062f628 100644 --- a/src/Backups/BackupCoordinationRemote.cpp +++ b/src/Backups/BackupCoordinationRemote.cpp @@ -358,7 +358,7 @@ String 
BackupCoordinationRemote::deserializeFromMultipleZooKeeperNodes(const Str void BackupCoordinationRemote::addReplicatedPartNames( - const String & table_shared_id, + const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & part_names_and_checksums) @@ -374,22 +374,22 @@ void BackupCoordinationRemote::addReplicatedPartNames( [&, &zk = holder.faulty_zookeeper]() { with_retries.renewZooKeeper(zk); - String path = zookeeper_path + "/repl_part_names/" + escapeForFileName(table_shared_id); + String path = zookeeper_path + "/repl_part_names/" + escapeForFileName(table_zk_path); zk->createIfNotExists(path, ""); path += "/" + escapeForFileName(replica_name); zk->createIfNotExists(path, ReplicatedPartNames::serialize(part_names_and_checksums, table_name_for_logs)); }); } -Strings BackupCoordinationRemote::getReplicatedPartNames(const String & table_shared_id, const String & replica_name) const +Strings BackupCoordinationRemote::getReplicatedPartNames(const String & table_zk_path, const String & replica_name) const { std::lock_guard lock{replicated_tables_mutex}; prepareReplicatedTables(); - return replicated_tables->getPartNames(table_shared_id, replica_name); + return replicated_tables->getPartNames(table_zk_path, replica_name); } void BackupCoordinationRemote::addReplicatedMutations( - const String & table_shared_id, + const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & mutations) @@ -405,23 +405,23 @@ void BackupCoordinationRemote::addReplicatedMutations( [&, &zk = holder.faulty_zookeeper]() { with_retries.renewZooKeeper(zk); - String path = zookeeper_path + "/repl_mutations/" + escapeForFileName(table_shared_id); + String path = zookeeper_path + "/repl_mutations/" + escapeForFileName(table_zk_path); zk->createIfNotExists(path, ""); path += "/" + escapeForFileName(replica_name); zk->createIfNotExists(path, ReplicatedMutations::serialize(mutations, table_name_for_logs)); }); } -std::vector BackupCoordinationRemote::getReplicatedMutations(const String & table_shared_id, const String & replica_name) const +std::vector BackupCoordinationRemote::getReplicatedMutations(const String & table_zk_path, const String & replica_name) const { std::lock_guard lock{replicated_tables_mutex}; prepareReplicatedTables(); - return replicated_tables->getMutations(table_shared_id, replica_name); + return replicated_tables->getMutations(table_zk_path, replica_name); } void BackupCoordinationRemote::addReplicatedDataPath( - const String & table_shared_id, const String & data_path) + const String & table_zk_path, const String & data_path) { { std::lock_guard lock{replicated_tables_mutex}; @@ -434,18 +434,18 @@ void BackupCoordinationRemote::addReplicatedDataPath( [&, &zk = holder.faulty_zookeeper]() { with_retries.renewZooKeeper(zk); - String path = zookeeper_path + "/repl_data_paths/" + escapeForFileName(table_shared_id); + String path = zookeeper_path + "/repl_data_paths/" + escapeForFileName(table_zk_path); zk->createIfNotExists(path, ""); path += "/" + escapeForFileName(data_path); zk->createIfNotExists(path, ""); }); } -Strings BackupCoordinationRemote::getReplicatedDataPaths(const String & table_shared_id) const +Strings BackupCoordinationRemote::getReplicatedDataPaths(const String & table_zk_path) const { std::lock_guard lock{replicated_tables_mutex}; prepareReplicatedTables(); - return replicated_tables->getDataPaths(table_shared_id); + return replicated_tables->getDataPaths(table_zk_path); } @@ 
-464,16 +464,16 @@ void BackupCoordinationRemote::prepareReplicatedTables() const with_retries.renewZooKeeper(zk); String path = zookeeper_path + "/repl_part_names"; - for (const String & escaped_table_shared_id : zk->getChildren(path)) + for (const String & escaped_table_zk_path : zk->getChildren(path)) { - String table_shared_id = unescapeForFileName(escaped_table_shared_id); - String path2 = path + "/" + escaped_table_shared_id; + String table_zk_path = unescapeForFileName(escaped_table_zk_path); + String path2 = path + "/" + escaped_table_zk_path; for (const String & escaped_replica_name : zk->getChildren(path2)) { String replica_name = unescapeForFileName(escaped_replica_name); auto part_names = ReplicatedPartNames::deserialize(zk->get(path2 + "/" + escaped_replica_name)); part_names_for_replicated_tables.push_back( - {table_shared_id, part_names.table_name_for_logs, replica_name, part_names.part_names_and_checksums}); + {table_zk_path, part_names.table_name_for_logs, replica_name, part_names.part_names_and_checksums}); } } }); @@ -489,16 +489,16 @@ void BackupCoordinationRemote::prepareReplicatedTables() const with_retries.renewZooKeeper(zk); String path = zookeeper_path + "/repl_mutations"; - for (const String & escaped_table_shared_id : zk->getChildren(path)) + for (const String & escaped_table_zk_path : zk->getChildren(path)) { - String table_shared_id = unescapeForFileName(escaped_table_shared_id); - String path2 = path + "/" + escaped_table_shared_id; + String table_zk_path = unescapeForFileName(escaped_table_zk_path); + String path2 = path + "/" + escaped_table_zk_path; for (const String & escaped_replica_name : zk->getChildren(path2)) { String replica_name = unescapeForFileName(escaped_replica_name); auto mutations = ReplicatedMutations::deserialize(zk->get(path2 + "/" + escaped_replica_name)); mutations_for_replicated_tables.push_back( - {table_shared_id, mutations.table_name_for_logs, replica_name, mutations.mutations}); + {table_zk_path, mutations.table_name_for_logs, replica_name, mutations.mutations}); } } }); @@ -514,14 +514,14 @@ void BackupCoordinationRemote::prepareReplicatedTables() const with_retries.renewZooKeeper(zk); String path = zookeeper_path + "/repl_data_paths"; - for (const String & escaped_table_shared_id : zk->getChildren(path)) + for (const String & escaped_table_zk_path : zk->getChildren(path)) { - String table_shared_id = unescapeForFileName(escaped_table_shared_id); - String path2 = path + "/" + escaped_table_shared_id; + String table_zk_path = unescapeForFileName(escaped_table_zk_path); + String path2 = path + "/" + escaped_table_zk_path; for (const String & escaped_data_path : zk->getChildren(path2)) { String data_path = unescapeForFileName(escaped_data_path); - data_paths_for_replicated_tables.push_back({table_shared_id, data_path}); + data_paths_for_replicated_tables.push_back({table_zk_path, data_path}); } } }); diff --git a/src/Backups/BackupCoordinationRemote.h b/src/Backups/BackupCoordinationRemote.h index ce891699bd2..7a56b1a4eb8 100644 --- a/src/Backups/BackupCoordinationRemote.h +++ b/src/Backups/BackupCoordinationRemote.h @@ -41,23 +41,23 @@ public: Strings waitForStage(const String & stage_to_wait, std::chrono::milliseconds timeout) override; void addReplicatedPartNames( - const String & table_shared_id, + const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector & part_names_and_checksums) override; - Strings getReplicatedPartNames(const String & table_shared_id, const String & 
+    Strings getReplicatedPartNames(const String & table_zk_path, const String & replica_name) const override;
 
     void addReplicatedMutations(
-        const String & table_shared_id,
+        const String & table_zk_path,
         const String & table_name_for_logs,
         const String & replica_name,
         const std::vector<MutationInfo> & mutations) override;
 
-    std::vector<MutationInfo> getReplicatedMutations(const String & table_shared_id, const String & replica_name) const override;
+    std::vector<MutationInfo> getReplicatedMutations(const String & table_zk_path, const String & replica_name) const override;
 
-    void addReplicatedDataPath(const String & table_shared_id, const String & data_path) override;
-    Strings getReplicatedDataPaths(const String & table_shared_id) const override;
+    void addReplicatedDataPath(const String & table_zk_path, const String & data_path) override;
+    Strings getReplicatedDataPaths(const String & table_zk_path) const override;
 
     void addReplicatedAccessFilePath(const String & access_zk_path, AccessEntityType access_entity_type, const String & file_path) override;
     Strings getReplicatedAccessFilePaths(const String & access_zk_path, AccessEntityType access_entity_type) const override;
diff --git a/src/Backups/BackupCoordinationReplicatedTables.cpp b/src/Backups/BackupCoordinationReplicatedTables.cpp
index 1cbb88acb82..a435667f79a 100644
--- a/src/Backups/BackupCoordinationReplicatedTables.cpp
+++ b/src/Backups/BackupCoordinationReplicatedTables.cpp
@@ -151,7 +151,7 @@ BackupCoordinationReplicatedTables::~BackupCoordinationReplicatedTables() = defa
 
 void BackupCoordinationReplicatedTables::addPartNames(PartNamesForTableReplica && part_names)
 {
-    const auto & table_shared_id = part_names.table_shared_id;
+    const auto & table_zk_path = part_names.table_zk_path;
     const auto & table_name_for_logs = part_names.table_name_for_logs;
     const auto & replica_name = part_names.replica_name;
     const auto & part_names_and_checksums = part_names.part_names_and_checksums;
@@ -159,7 +159,7 @@ void BackupCoordinationReplicatedTables::addPartNames(PartNamesForTableReplica &
     if (prepared)
         throw Exception(ErrorCodes::LOGICAL_ERROR, "addPartNames() must not be called after preparing");
 
-    auto & table_info = table_infos[table_shared_id];
+    auto & table_info = table_infos[table_zk_path];
     table_info.table_name_for_logs = table_name_for_logs;
 
     if (!table_info.covered_parts_finder)
@@ -200,11 +200,11 @@ void BackupCoordinationReplicatedTables::addPartNames(PartNamesForTableReplica &
     }
 }
 
-Strings BackupCoordinationReplicatedTables::getPartNames(const String & table_shared_id, const String & replica_name) const
+Strings BackupCoordinationReplicatedTables::getPartNames(const String & table_zk_path, const String & replica_name) const
 {
     prepare();
 
-    auto it = table_infos.find(table_shared_id);
+    auto it = table_infos.find(table_zk_path);
     if (it == table_infos.end())
         return {};
 
@@ -218,7 +218,7 @@ Strings BackupCoordinationReplicatedTables::getPartNames(const String & table_sh
 
 void BackupCoordinationReplicatedTables::addMutations(MutationsForTableReplica && mutations_for_table_replica)
 {
-    const auto & table_shared_id = mutations_for_table_replica.table_shared_id;
+    const auto & table_zk_path = mutations_for_table_replica.table_zk_path;
     const auto & table_name_for_logs = mutations_for_table_replica.table_name_for_logs;
     const auto & replica_name = mutations_for_table_replica.replica_name;
     const auto & mutations = mutations_for_table_replica.mutations;
@@ -226,7 +226,7 @@ void BackupCoordinationReplicatedTables::addMutations(MutationsForTableReplica &
     if (prepared)
         throw Exception(ErrorCodes::LOGICAL_ERROR, "addMutations() must not be called after preparing");
 
-    auto & table_info = table_infos[table_shared_id];
+    auto & table_info = table_infos[table_zk_path];
     table_info.table_name_for_logs = table_name_for_logs;
     for (const auto & [mutation_id, mutation_entry] : mutations)
         table_info.mutations.emplace(mutation_id, mutation_entry);
@@ -236,11 +236,11 @@ void BackupCoordinationReplicatedTables::addMutations(MutationsForTableReplica &
 }
 
 std::vector<MutationInfo>
-BackupCoordinationReplicatedTables::getMutations(const String & table_shared_id, const String & replica_name) const
+BackupCoordinationReplicatedTables::getMutations(const String & table_zk_path, const String & replica_name) const
 {
     prepare();
 
-    auto it = table_infos.find(table_shared_id);
+    auto it = table_infos.find(table_zk_path);
     if (it == table_infos.end())
         return {};
 
@@ -257,16 +257,16 @@ BackupCoordinationReplicatedTables::getMutations(const String & table_shared_id,
 
 void BackupCoordinationReplicatedTables::addDataPath(DataPathForTableReplica && data_path_for_table_replica)
 {
-    const auto & table_shared_id = data_path_for_table_replica.table_shared_id;
+    const auto & table_zk_path = data_path_for_table_replica.table_zk_path;
     const auto & data_path = data_path_for_table_replica.data_path;
 
-    auto & table_info = table_infos[table_shared_id];
+    auto & table_info = table_infos[table_zk_path];
     table_info.data_paths.emplace(data_path);
 }
 
-Strings BackupCoordinationReplicatedTables::getDataPaths(const String & table_shared_id) const
+Strings BackupCoordinationReplicatedTables::getDataPaths(const String & table_zk_path) const
 {
-    auto it = table_infos.find(table_shared_id);
+    auto it = table_infos.find(table_zk_path);
     if (it == table_infos.end())
         return {};
 
diff --git a/src/Backups/BackupCoordinationReplicatedTables.h b/src/Backups/BackupCoordinationReplicatedTables.h
index 74f21eb9c7c..50ab56aef75 100644
--- a/src/Backups/BackupCoordinationReplicatedTables.h
+++ b/src/Backups/BackupCoordinationReplicatedTables.h
@@ -40,7 +40,7 @@ public:
 
     struct PartNamesForTableReplica
     {
-        String table_shared_id;
+        String table_zk_path;
         String table_name_for_logs;
         String replica_name;
         std::vector<PartNameAndChecksum> part_names_and_checksums;
@@ -55,13 +55,13 @@ public:
     /// Returns the names of the parts which a specified replica of a replicated table should put to the backup.
     /// This is the same list as it was added by call of the function addPartNames() but without duplications and without
     /// parts covered by another parts.
-    Strings getPartNames(const String & table_shared_id, const String & replica_name) const;
+    Strings getPartNames(const String & table_zk_path, const String & replica_name) const;
 
     using MutationInfo = IBackupCoordination::MutationInfo;
 
     struct MutationsForTableReplica
     {
-        String table_shared_id;
+        String table_zk_path;
         String table_name_for_logs;
         String replica_name;
         std::vector<MutationInfo> mutations;
@@ -71,11 +71,11 @@ public:
     void addMutations(MutationsForTableReplica && mutations_for_table_replica);
 
     /// Returns all mutations of a replicated table which are not finished for some data parts added by addReplicatedPartNames().
-    std::vector<MutationInfo> getMutations(const String & table_shared_id, const String & replica_name) const;
+    std::vector<MutationInfo> getMutations(const String & table_zk_path, const String & replica_name) const;
 
     struct DataPathForTableReplica
     {
-        String table_shared_id;
+        String table_zk_path;
         String data_path;
     };
 
@@ -85,7 +85,7 @@ public:
     void addDataPath(DataPathForTableReplica && data_path_for_table_replica);
 
     /// Returns all the data paths in backup added for a replicated table (see also addReplicatedDataPath()).
-    Strings getDataPaths(const String & table_shared_id) const;
+    Strings getDataPaths(const String & table_zk_path) const;
 
 private:
     void prepare() const;
@@ -110,7 +110,7 @@ private:
         std::unordered_set<String> data_paths;
     };
 
-    std::map<String /* table_shared_id */, TableInfo> table_infos; /// Should be ordered because we need this map to be in the same order on every replica.
+    std::map<String /* table_zk_path */, TableInfo> table_infos; /// Should be ordered because we need this map to be in the same order on every replica.
     mutable bool prepared = false;
 };
 
diff --git a/src/Backups/BackupEntriesCollector.cpp b/src/Backups/BackupEntriesCollector.cpp
index cc014c279cc..136e3c49321 100644
--- a/src/Backups/BackupEntriesCollector.cpp
+++ b/src/Backups/BackupEntriesCollector.cpp
@@ -11,6 +11,7 @@
 #include
 #include
 #include
+#include <Storages/MergeTree/extractZkPathFromCreateQuery.h>
 #include
 #include
 #include
@@ -758,7 +759,7 @@ void BackupEntriesCollector::makeBackupEntriesForDatabasesDefs()
         checkIsQueryCancelled();
 
         ASTPtr new_create_query = database_info.create_database_query;
-        adjustCreateQueryForBackup(new_create_query, context->getGlobalContext(), nullptr);
+        adjustCreateQueryForBackup(new_create_query, context->getGlobalContext());
         renameDatabaseAndTableNameInCreateQuery(new_create_query, renaming_map, context->getGlobalContext());
 
         const String & metadata_path_in_backup = database_info.metadata_path_in_backup;
@@ -775,7 +776,8 @@ void BackupEntriesCollector::makeBackupEntriesForTablesDefs()
         checkIsQueryCancelled();
 
         ASTPtr new_create_query = table_info.create_table_query;
-        adjustCreateQueryForBackup(new_create_query, context->getGlobalContext(), &table_info.replicated_table_shared_id);
+        table_info.replicated_table_zk_path = tryExtractZkPathFromCreateQuery(*new_create_query, context->getGlobalContext());
+        adjustCreateQueryForBackup(new_create_query, context->getGlobalContext());
         renameDatabaseAndTableNameInCreateQuery(new_create_query, renaming_map, context->getGlobalContext());
 
         const String & metadata_path_in_backup = table_info.metadata_path_in_backup;
@@ -814,8 +816,8 @@ void BackupEntriesCollector::makeBackupEntriesForTableData(const QualifiedTableN
         /// If this table is replicated in this case we call IBackupCoordination::addReplicatedDataPath() which will cause
         /// other replicas to fill the storage's data in the backup.
         /// If this table is not replicated we'll do nothing leaving the storage's data empty in the backup.
-        if (table_info.replicated_table_shared_id)
-            backup_coordination->addReplicatedDataPath(*table_info.replicated_table_shared_id, data_path_in_backup);
+        if (table_info.replicated_table_zk_path)
+            backup_coordination->addReplicatedDataPath(*table_info.replicated_table_zk_path, data_path_in_backup);
         return;
     }
 
diff --git a/src/Backups/BackupEntriesCollector.h b/src/Backups/BackupEntriesCollector.h
index 01e8d594334..c7bce077a2d 100644
--- a/src/Backups/BackupEntriesCollector.h
+++ b/src/Backups/BackupEntriesCollector.h
@@ -164,7 +164,7 @@ private:
         ASTPtr create_table_query;
         String metadata_path_in_backup;
         std::filesystem::path data_path_in_backup;
-        std::optional<String> replicated_table_shared_id;
+        std::optional<String> replicated_table_zk_path;
         std::optional<ASTs> partitions;
     };
 
diff --git a/src/Backups/BackupUtils.cpp b/src/Backups/BackupUtils.cpp
index fb448fb64ad..fa8ed5855dd 100644
--- a/src/Backups/BackupUtils.cpp
+++ b/src/Backups/BackupUtils.cpp
@@ -103,7 +103,7 @@ bool compareRestoredTableDef(const IAST & restored_table_create_query, const IAS
     auto adjust_before_comparison = [&](const IAST & query) -> ASTPtr
     {
         auto new_query = query.clone();
-        adjustCreateQueryForBackup(new_query, global_context, nullptr);
+        adjustCreateQueryForBackup(new_query, global_context);
         ASTCreateQuery & create = typeid_cast<ASTCreateQuery &>(*new_query);
         create.setUUID({});
         create.if_not_exists = false;
diff --git a/src/Backups/DDLAdjustingForBackupVisitor.cpp b/src/Backups/DDLAdjustingForBackupVisitor.cpp
index 5ea91094b75..7e5ce91629b 100644
--- a/src/Backups/DDLAdjustingForBackupVisitor.cpp
+++ b/src/Backups/DDLAdjustingForBackupVisitor.cpp
@@ -27,9 +27,6 @@ namespace
     {
         /// Precondition: engine_name.starts_with("Replicated") && engine_name.ends_with("MergeTree")
 
-        if (data.replicated_table_shared_id)
-            *data.replicated_table_shared_id = StorageReplicatedMergeTree::tryGetTableSharedIDFromCreateQuery(*data.create_query, data.global_context);
-
        /// Before storing the metadata in a backup we have to find a zookeeper path in its definition and turn the table's UUID in there
        /// back into "{uuid}", and also we probably can remove the zookeeper path and replica name if they're default.
        /// So we're kind of reverting what we had done to the table's definition in registerStorageMergeTree.cpp before we created this table.
@@ -98,12 +95,9 @@ void DDLAdjustingForBackupVisitor::visit(ASTPtr ast, const Data & data)
         visitCreateQuery(*create, data);
 }
 
-void adjustCreateQueryForBackup(ASTPtr ast, const ContextPtr & global_context, std::optional<String> * replicated_table_shared_id)
+void adjustCreateQueryForBackup(ASTPtr ast, const ContextPtr & global_context)
 {
-    if (replicated_table_shared_id)
-        *replicated_table_shared_id = {};
-
-    DDLAdjustingForBackupVisitor::Data data{ast, global_context, replicated_table_shared_id};
+    DDLAdjustingForBackupVisitor::Data data{ast, global_context};
     DDLAdjustingForBackupVisitor::Visitor{data}.visit(ast);
 }
 
diff --git a/src/Backups/DDLAdjustingForBackupVisitor.h b/src/Backups/DDLAdjustingForBackupVisitor.h
index 63353dcc000..f0508434e02 100644
--- a/src/Backups/DDLAdjustingForBackupVisitor.h
+++ b/src/Backups/DDLAdjustingForBackupVisitor.h
@@ -12,9 +12,7 @@ class Context;
 using ContextPtr = std::shared_ptr<const Context>;
 
 /// Changes a create query to a form which is appropriate or suitable for saving in a backup.
-/// Also extracts a replicated table's shared ID from the create query if this is a create query for a replicated table.
-/// `replicated_table_shared_id` can be null if you don't need that.
-void adjustCreateQueryForBackup(ASTPtr ast, const ContextPtr & global_context, std::optional<String> * replicated_table_shared_id);
+void adjustCreateQueryForBackup(ASTPtr ast, const ContextPtr & global_context);
 
 /// Visits ASTCreateQuery and changes it to a form which is appropriate or suitable for saving in a backup.
 class DDLAdjustingForBackupVisitor
@@ -24,7 +22,6 @@ public:
     {
         ASTPtr create_query;
         ContextPtr global_context;
-        std::optional<String> * replicated_table_shared_id = nullptr;
     };
 
     using Visitor = InDepthNodeVisitor<DDLAdjustingForBackupVisitor, false>;
diff --git a/src/Backups/IBackupCoordination.h b/src/Backups/IBackupCoordination.h
index f80b5dee883..4a9f8a23855 100644
--- a/src/Backups/IBackupCoordination.h
+++ b/src/Backups/IBackupCoordination.h
@@ -36,13 +36,13 @@ public:
     /// Multiple replicas of the replicated table call this function and then the added part names can be returned by call of the function
     /// getReplicatedPartNames().
     /// Checksums are used only to control that parts under the same names on different replicas are the same.
-    virtual void addReplicatedPartNames(const String & table_shared_id, const String & table_name_for_logs, const String & replica_name,
+    virtual void addReplicatedPartNames(const String & table_zk_path, const String & table_name_for_logs, const String & replica_name,
                                         const std::vector<PartNameAndChecksum> & part_names_and_checksums) = 0;
 
     /// Returns the names of the parts which a specified replica of a replicated table should put to the backup.
     /// This is the same list as it was added by call of the function addReplicatedPartNames() but without duplications and without
     /// parts covered by another parts.
-    virtual Strings getReplicatedPartNames(const String & table_shared_id, const String & replica_name) const = 0;
+    virtual Strings getReplicatedPartNames(const String & table_zk_path, const String & replica_name) const = 0;
 
     struct MutationInfo
     {
@@ -51,10 +51,10 @@ public:
     };
 
     /// Adds information about mutations of a replicated table.
-    virtual void addReplicatedMutations(const String & table_shared_id, const String & table_name_for_logs, const String & replica_name, const std::vector<MutationInfo> & mutations) = 0;
+    virtual void addReplicatedMutations(const String & table_zk_path, const String & table_name_for_logs, const String & replica_name, const std::vector<MutationInfo> & mutations) = 0;
 
     /// Returns all mutations of a replicated table which are not finished for some data parts added by addReplicatedPartNames().
-    virtual std::vector<MutationInfo> getReplicatedMutations(const String & table_shared_id, const String & replica_name) const = 0;
+    virtual std::vector<MutationInfo> getReplicatedMutations(const String & table_zk_path, const String & replica_name) const = 0;
 
     /// Adds information about KeeperMap tables
     virtual void addKeeperMapTable(const String & table_zookeeper_root_path, const String & table_id, const String & data_path_in_backup) = 0;
@@ -65,10 +65,10 @@ public:
     /// Adds a data path in backup for a replicated table.
     /// Multiple replicas of the replicated table call this function and then all the added paths can be returned by call of the function
     /// getReplicatedDataPaths().
-    virtual void addReplicatedDataPath(const String & table_shared_id, const String & data_path) = 0;
+    virtual void addReplicatedDataPath(const String & table_zk_path, const String & data_path) = 0;
 
     /// Returns all the data paths in backup added for a replicated table (see also addReplicatedDataPath()).
-    virtual Strings getReplicatedDataPaths(const String & table_shared_id) const = 0;
+    virtual Strings getReplicatedDataPaths(const String & table_zk_path) const = 0;
 
     /// Adds a path to access.txt file keeping access entities of a ReplicatedAccessStorage.
     virtual void addReplicatedAccessFilePath(const String & access_zk_path, AccessEntityType access_entity_type, const String & file_path) = 0;
diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp
index c425035dfba..58d1846915f 100644
--- a/src/Storages/StorageReplicatedMergeTree.cpp
+++ b/src/Storages/StorageReplicatedMergeTree.cpp
@@ -187,7 +187,6 @@ namespace ErrorCodes
     extern const int NOT_INITIALIZED;
     extern const int TOO_LARGE_DISTRIBUTED_DEPTH;
     extern const int TABLE_IS_DROPPED;
-    extern const int CANNOT_BACKUP_TABLE;
     extern const int SUPPORT_IS_DISABLED;
     extern const int FAULT_INJECTED;
     extern const int CANNOT_FORGET_PARTITION;
@@ -310,8 +309,9 @@ StorageReplicatedMergeTree::StorageReplicatedMergeTree(
         true,   /// require_part_metadata
         mode,
         [this] (const std::string & name) { enqueuePartForCheck(name); })
-    , zookeeper_name(zkutil::extractZooKeeperName(zookeeper_path_))
-    , zookeeper_path(zkutil::extractZooKeeperPath(zookeeper_path_, /* check_starts_with_slash */ mode <= LoadingStrictnessLevel::CREATE, log.load()))
+    , full_zookeeper_path(zookeeper_path_)
+    , zookeeper_name(zkutil::extractZooKeeperName(full_zookeeper_path))
+    , zookeeper_path(zkutil::extractZooKeeperPath(full_zookeeper_path, /* check_starts_with_slash */ mode <= LoadingStrictnessLevel::CREATE, log.load()))
     , replica_name(replica_name_)
     , replica_path(fs::path(zookeeper_path) / "replicas" / replica_name_)
     , reader(*this)
@@ -9242,24 +9242,6 @@ void StorageReplicatedMergeTree::createTableSharedID() const
 }
 
 
-std::optional<String> StorageReplicatedMergeTree::tryGetTableSharedIDFromCreateQuery(const IAST & create_query, const ContextPtr & global_context)
-{
-    auto zk_path = tryExtractZkPathFromCreateQuery(create_query, global_context);
-    if (!zk_path)
-        return {};
-
-    String zk_name = zkutil::extractZooKeeperName(*zk_path);
-    zk_path = zkutil::extractZooKeeperPath(*zk_path, false, nullptr);
-    zkutil::ZooKeeperPtr zookeeper = (zk_name == getDefaultZooKeeperName()) ? global_context->getZooKeeper() : global_context->getAuxiliaryZooKeeper(zk_name);
-
-    String id;
-    if (!zookeeper->tryGet(fs::path(*zk_path) / "table_shared_id", id))
-        return {};
-
-    return id;
-}
-
-
 zkutil::EphemeralNodeHolderPtr StorageReplicatedMergeTree::lockSharedDataTemporary(const String & part_name, const String & part_id, const DiskPtr & disk) const
 {
     auto settings = getSettings();
@@ -10419,21 +10401,10 @@ void StorageReplicatedMergeTree::adjustCreateQueryForBackup(ASTPtr & create_quer
         auto metadata_diff = ReplicatedMergeTreeTableMetadata(*this, current_metadata).checkAndFindDiff(metadata_from_entry, current_metadata->getColumns(), getContext());
         auto adjusted_metadata = metadata_diff.getNewMetadata(columns_from_entry, getContext(), *current_metadata);
         applyMetadataChangesToCreateQuery(create_query, adjusted_metadata);
-
-        /// Check that tryGetTableSharedIDFromCreateQuery() works for this storage.
-        auto actual_table_shared_id = getTableSharedID();
-        auto expected_table_shared_id = tryGetTableSharedIDFromCreateQuery(*create_query, getContext());
-        if (actual_table_shared_id != expected_table_shared_id)
-        {
-            throw Exception(ErrorCodes::CANNOT_BACKUP_TABLE, "Table {} has its shared ID different from one from the create query: "
-                            "actual shared id = {}, expected shared id = {}, create query = {}",
-                            getStorageID().getNameForLogs(), actual_table_shared_id, expected_table_shared_id.value_or("nullopt"),
-                            create_query);
-        }
     }
     catch (...)
     {
-        /// We can continue making a backup with non-adjusted name.
+        /// We can continue making a backup with non-adjusted query.
        tryLogCurrentException(log, "Failed to adjust the create query of this table for backup");
     }
 }
@@ -10459,8 +10430,8 @@ void StorageReplicatedMergeTree::backupData(
     auto parts_backup_entries = backupParts(data_parts, /* data_path_in_backup */ "", backup_settings, read_settings, local_context);
 
     auto coordination = backup_entries_collector.getBackupCoordination();
-    String shared_id = getTableSharedID();
-    coordination->addReplicatedDataPath(shared_id, data_path_in_backup);
+
+    coordination->addReplicatedDataPath(full_zookeeper_path, data_path_in_backup);
 
     using PartNameAndChecksum = IBackupCoordination::PartNameAndChecksum;
     std::vector<PartNameAndChecksum> part_names_with_hashes;
@@ -10469,7 +10440,7 @@ void StorageReplicatedMergeTree::backupData(
         part_names_with_hashes.emplace_back(PartNameAndChecksum{part_backup_entries.part_name, part_backup_entries.part_checksum});
 
     /// Send our list of part names to the coordination (to compare with other replicas).
-    coordination->addReplicatedPartNames(shared_id, getStorageID().getFullTableName(), getReplicaName(), part_names_with_hashes);
+    coordination->addReplicatedPartNames(full_zookeeper_path, getStorageID().getFullTableName(), getReplicaName(), part_names_with_hashes);
 
     /// Send a list of mutations to the coordination too (we need to find the mutations which are not finished for added part names).
     {
@@ -10511,25 +10482,25 @@ void StorageReplicatedMergeTree::backupData(
         }
 
         if (!mutation_infos.empty())
-            coordination->addReplicatedMutations(shared_id, getStorageID().getFullTableName(), getReplicaName(), mutation_infos);
+            coordination->addReplicatedMutations(full_zookeeper_path, getStorageID().getFullTableName(), getReplicaName(), mutation_infos);
         }
     }
 
     /// This task will be executed after all replicas have collected their parts and the coordination is ready to
     /// give us the final list of parts to add to the BackupEntriesCollector.
-    auto post_collecting_task = [shared_id,
+    auto post_collecting_task = [my_full_zookeeper_path = full_zookeeper_path,
                                  my_replica_name = getReplicaName(),
                                  coordination,
                                  my_parts_backup_entries = std::move(parts_backup_entries),
                                  &backup_entries_collector]()
     {
-        Strings data_paths = coordination->getReplicatedDataPaths(shared_id);
+        Strings data_paths = coordination->getReplicatedDataPaths(my_full_zookeeper_path);
         std::vector<fs::path> data_paths_fs;
         data_paths_fs.reserve(data_paths.size());
         for (const auto & data_path : data_paths)
             data_paths_fs.push_back(data_path);
 
-        Strings part_names = coordination->getReplicatedPartNames(shared_id, my_replica_name);
+        Strings part_names = coordination->getReplicatedPartNames(my_full_zookeeper_path, my_replica_name);
         std::unordered_set<String> part_names_set{part_names.begin(), part_names.end()};
 
         for (const auto & part_backup_entries : my_parts_backup_entries)
@@ -10542,7 +10513,7 @@ void StorageReplicatedMergeTree::backupData(
             }
         }
 
-        auto mutation_infos = coordination->getReplicatedMutations(shared_id, my_replica_name);
+        auto mutation_infos = coordination->getReplicatedMutations(my_full_zookeeper_path, my_replica_name);
         for (const auto & mutation_info : mutation_infos)
         {
             auto backup_entry = ReplicatedMergeTreeMutationEntry::parse(mutation_info.entry, mutation_info.id).backup();
@@ -10556,8 +10527,7 @@ void StorageReplicatedMergeTree::backupData(
 
 void StorageReplicatedMergeTree::restoreDataFromBackup(RestorerFromBackup & restorer, const String & data_path_in_backup, const std::optional<ASTs> & partitions)
 {
-    String full_zk_path = getZooKeeperName() + getZooKeeperPath();
-    if (!restorer.getRestoreCoordination()->acquireInsertingDataIntoReplicatedTable(full_zk_path))
+    if (!restorer.getRestoreCoordination()->acquireInsertingDataIntoReplicatedTable(full_zookeeper_path))
     {
         /// Other replica is already restoring the data of this table.
         /// We'll get them later due to replication, it's not necessary to read it from the backup.
diff --git a/src/Storages/StorageReplicatedMergeTree.h b/src/Storages/StorageReplicatedMergeTree.h
index c472c11e7f8..7f33c82e5c2 100644
--- a/src/Storages/StorageReplicatedMergeTree.h
+++ b/src/Storages/StorageReplicatedMergeTree.h
@@ -330,17 +330,14 @@ public:
 
     // Return default or custom zookeeper name for table
     const String & getZooKeeperName() const { return zookeeper_name; }
 
-    const String & getZooKeeperPath() const { return zookeeper_path; }
+    const String & getFullZooKeeperPath() const { return full_zookeeper_path; }
 
     // Return table id, common for different replicas
     String getTableSharedID() const override;
 
     std::map<std::string, MutationCommands> getUnfinishedMutationCommands() const override;
 
-    /// Returns the same as getTableSharedID(), but extracts it from a create query.
-    static std::optional<String> tryGetTableSharedIDFromCreateQuery(const IAST & create_query, const ContextPtr & global_context);
-
     static const String & getDefaultZooKeeperName() { return default_zookeeper_name; }
 
     /// Check if there are new broken disks and enqueue part recovery tasks.
@@ -420,9 +417,11 @@ private:
 
     bool is_readonly_metric_set = false;
 
+    const String full_zookeeper_path;
     static const String default_zookeeper_name;
     const String zookeeper_name;
     const String zookeeper_path;
+
     const String replica_name;
     const String replica_path;
 
From 6e579312633f2c0abb8784f122bfc75559a5d05a Mon Sep 17 00:00:00 2001
From: Vitaly Baranov
Date: Thu, 25 Apr 2024 19:24:36 +0200
Subject: [PATCH 064/289] Get rid of code duplication in extractZkPathFromCreateQuery().
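
The same engine-argument parsing and macro expansion that runs on CREATE TABLE
is now also used when a backup needs the table's ZooKeeper path, instead of a
second, simplified copy of that logic. A minimal usage sketch of the new helper
(illustrative only; `context` is assumed to be a valid ContextPtr and
`create_query_ast` an already-parsed CREATE TABLE AST — neither line below is
part of this patch):

    // Hedged sketch of calling the new API. The helper returns std::nullopt
    // for non-replicated engines or when macro expansion fails.
    const auto & create = create_query_ast->as<ASTCreateQuery &>();
    std::optional<String> zk_path = extractZooKeeperPathFromReplicatedTableDef(create, context);
    if (zk_path)
        LOG_INFO(getLogger("Backup"), "Replicated table is coordinated at {}", *zk_path);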
---
 src/Backups/BackupEntriesCollector.cpp        |   4 +-
 .../extractZkPathFromCreateQuery.cpp          |  61 ---
 .../MergeTree/extractZkPathFromCreateQuery.h  |  19 -
 ...tractZooKeeperPathFromReplicatedTableDef.h |  18 +
 .../MergeTree/registerStorageMergeTree.cpp    | 401 +++++++++++-------
 src/Storages/StorageReplicatedMergeTree.cpp   |   1 -
 6 files changed, 272 insertions(+), 232 deletions(-)
 delete mode 100644 src/Storages/MergeTree/extractZkPathFromCreateQuery.cpp
 delete mode 100644 src/Storages/MergeTree/extractZkPathFromCreateQuery.h
 create mode 100644 src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h

diff --git a/src/Backups/BackupEntriesCollector.cpp b/src/Backups/BackupEntriesCollector.cpp
index 136e3c49321..d91cf47c4d3 100644
--- a/src/Backups/BackupEntriesCollector.cpp
+++ b/src/Backups/BackupEntriesCollector.cpp
@@ -11,7 +11,7 @@
 #include
 #include
 #include
-#include <Storages/MergeTree/extractZkPathFromCreateQuery.h>
+#include <Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h>
 #include
 #include
 #include
@@ -776,7 +776,7 @@ void BackupEntriesCollector::makeBackupEntriesForTablesDefs()
         checkIsQueryCancelled();
 
         ASTPtr new_create_query = table_info.create_table_query;
-        table_info.replicated_table_zk_path = tryExtractZkPathFromCreateQuery(*new_create_query, context->getGlobalContext());
+        table_info.replicated_table_zk_path = extractZooKeeperPathFromReplicatedTableDef(new_create_query->as<ASTCreateQuery &>(), context);
         adjustCreateQueryForBackup(new_create_query, context->getGlobalContext());
         renameDatabaseAndTableNameInCreateQuery(new_create_query, renaming_map, context->getGlobalContext());
 
diff --git a/src/Storages/MergeTree/extractZkPathFromCreateQuery.cpp b/src/Storages/MergeTree/extractZkPathFromCreateQuery.cpp
deleted file mode 100644
index 8ea732b0243..00000000000
--- a/src/Storages/MergeTree/extractZkPathFromCreateQuery.cpp
+++ /dev/null
@@ -1,61 +0,0 @@
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-#include
-
-
-namespace DB
-{
-
-std::optional<String> tryExtractZkPathFromCreateQuery(const IAST & create_query, const ContextPtr & global_context)
-{
-    const auto * create = create_query.as<ASTCreateQuery>();
-    if (!create || !create->storage || !create->storage->engine)
-        return {};
-
-    /// Check if the table engine is one of the ReplicatedMergeTree family.
-    const auto & ast_engine = *create->storage->engine;
-    if (!ast_engine.name.starts_with("Replicated") || !ast_engine.name.ends_with("MergeTree"))
-        return {};
-
-    /// Get the first argument.
-    const auto * ast_arguments = typeid_cast<ASTExpressionList *>(ast_engine.arguments.get());
-    if (!ast_arguments || ast_arguments->children.empty())
-        return {};
-
-    auto * ast_zk_path = typeid_cast<ASTLiteral *>(ast_arguments->children[0].get());
-    if (!ast_zk_path || (ast_zk_path->value.getType() != Field::Types::String))
-        return {};
-
-    String zk_path = ast_zk_path->value.safeGet<String>();
-
-    /// Expand macros.
-    Macros::MacroExpansionInfo info;
-    info.table_id.table_name = create->getTable();
-    info.table_id.database_name = create->getDatabase();
-    info.table_id.uuid = create->uuid;
-    auto database = DatabaseCatalog::instance().tryGetDatabase(info.table_id.database_name);
-    if (database && database->getEngineName() == "Replicated")
-    {
-        info.shard = getReplicatedDatabaseShardName(database);
-        info.replica = getReplicatedDatabaseReplicaName(database);
-    }
-
-    try
-    {
-        zk_path = global_context->getMacros()->expand(zk_path, info);
-    }
-    catch (...)
-    {
-        return {}; /// Couldn't expand macros.
-    }
-
-    return zk_path;
-}
-
-}
diff --git a/src/Storages/MergeTree/extractZkPathFromCreateQuery.h b/src/Storages/MergeTree/extractZkPathFromCreateQuery.h
deleted file mode 100644
index e22f76d2cd5..00000000000
--- a/src/Storages/MergeTree/extractZkPathFromCreateQuery.h
+++ /dev/null
@@ -1,19 +0,0 @@
-#pragma once
-
-#include
-#include
-#include
-
-
-namespace DB
-{
-class IAST;
-class Context;
-using ContextPtr = std::shared_ptr<const Context>;
-
-/// Extracts a zookeeper path from a specified CREATE TABLE query. Returns std::nullopt if fails.
-/// The function takes the first argument of the ReplicatedMergeTree table engine and expands macros in it.
-/// It works like a part of what the create() function in registerStorageMergeTree.cpp does but in a simpler manner.
-std::optional<String> tryExtractZkPathFromCreateQuery(const IAST & create_query, const ContextPtr & global_context);
-
-}
diff --git a/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h b/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h
new file mode 100644
index 00000000000..1bd58392201
--- /dev/null
+++ b/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h
@@ -0,0 +1,18 @@
+#pragma once
+
+#include
+#include
+#include
+
+
+namespace DB
+{
+class ASTCreateQuery;
+class Context;
+using ContextPtr = std::shared_ptr<const Context>;
+
+/// Extracts a zookeeper path from a specified CREATE TABLE query. Returns std::nullopt if it fails.
+/// The function checks the table engine and if it is Replicated*MergeTree then it takes the first argument and expands macros in it.
+std::optional<String> extractZooKeeperPathFromReplicatedTableDef(const ASTCreateQuery & create_query, const ContextPtr & context);
+
+}
diff --git a/src/Storages/MergeTree/registerStorageMergeTree.cpp b/src/Storages/MergeTree/registerStorageMergeTree.cpp
index d552a4b6fa5..9b0200d5a1c 100644
--- a/src/Storages/MergeTree/registerStorageMergeTree.cpp
+++ b/src/Storages/MergeTree/registerStorageMergeTree.cpp
@@ -1,6 +1,7 @@
 #include
 #include
 #include
+#include <Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h>
 #include
 #include
 #include
@@ -122,6 +123,248 @@ static void verifySortingKey(const KeyDescription & sorting_key)
     }
 }
 
+/// Returns whether a new syntax is used to define a table engine, i.e. MergeTree() PRIMARY KEY ... PARTITION BY ... SETTINGS ...
+/// instead of MergeTree(date, [sample_key], primary_key).
+static bool isExtendedStorageDef(const ASTCreateQuery & query)
+{
+    if (query.storage && query.storage->isExtendedStorageDefinition())
+        return true;
+
+    if (query.columns_list &&
+        ((query.columns_list->indices && !query.columns_list->indices->children.empty()) ||
+         (query.columns_list->projections && !query.columns_list->projections->children.empty())))
+    {
+        return true;
+    }
+
+    return false;
+}
+
+/// Evaluates expressions in engine arguments.
+/// In new syntax an argument can be literal or identifier or array/tuple of identifiers.
+static void evaluateEngineArgs(ASTs & engine_args, const ContextPtr & context)
+{
+    size_t arg_idx = 0;
+    try
+    {
+        for (; arg_idx < engine_args.size(); ++arg_idx)
+        {
+            auto & arg = engine_args[arg_idx];
+            auto * arg_func = arg->as<ASTFunction>();
+            if (!arg_func)
+                continue;
+
+            /// If we got ASTFunction, let's evaluate it and replace with ASTLiteral.
+            /// Do not try evaluate array or tuple, because it's array or tuple of column identifiers.
+            if (arg_func->name == "array" || arg_func->name == "tuple")
+                continue;
+            Field value = evaluateConstantExpression(arg, context).first;
+            arg = std::make_shared<ASTLiteral>(value);
+        }
+    }
+    catch (Exception & e)
+    {
+        throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot evaluate engine argument {}: {} {}",
+                        arg_idx, e.message(), verbose_help_message);
+    }
+}
+
+/// Returns whether this is a Replicated table engine.
+static bool isReplicated(const String & engine_name)
+{
+    return engine_name.starts_with("Replicated") && engine_name.ends_with("MergeTree");
+}
+
+/// Returns the part of the name of a table engine between "Replicated" (if any) and "MergeTree".
+static std::string_view getNamePart(const String & engine_name)
+{
+    std::string_view name_part = engine_name;
+    if (name_part.starts_with("Replicated"))
+        name_part.remove_prefix(strlen("Replicated"));
+
+    if (name_part.ends_with("MergeTree"))
+        name_part.remove_suffix(strlen("MergeTree"));
+
+    return name_part;
+}
+
+/// Extracts zookeeper path and replica name from the table engine's arguments.
+/// The function can modify those arguments (that's why they're passed separately in `engine_args`) and also determines RenamingRestrictions.
+/// The function assumes the table engine is Replicated.
+static void extractZooKeeperPathAndReplicaNameFromEngineArgs(
+    const ASTCreateQuery & query,
+    const StorageID & table_id,
+    const String & engine_name,
+    ASTs & engine_args,
+    LoadingStrictnessLevel mode,
+    const ContextPtr & context,
+    String & zookeeper_path,
+    String & replica_name,
+    RenamingRestrictions & renaming_restrictions)
+{
+    chassert(isReplicated(engine_name));
+
+    zookeeper_path = "";
+    replica_name = "";
+    renaming_restrictions = RenamingRestrictions::ALLOW_ANY;
+
+    bool is_extended_storage_def = isExtendedStorageDef(query);
+
+    if (is_extended_storage_def)
+    {
+        /// Allow expressions in engine arguments.
+        /// In new syntax argument can be literal or identifier or array/tuple of identifiers.
+        evaluateEngineArgs(engine_args, context);
+    }
+
+    bool is_on_cluster = context->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY;
+    bool is_replicated_database = context->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY &&
+        DatabaseCatalog::instance().getDatabase(table_id.database_name)->getEngineName() == "Replicated";
+
+    /// Allow implicit {uuid} macros only for zookeeper_path in ON CLUSTER queries
+    /// and if UUID was explicitly passed in CREATE TABLE (like for ATTACH)
+    bool allow_uuid_macro = is_on_cluster || is_replicated_database || query.attach || query.has_uuid;
+
+    auto expand_macro = [&] (ASTLiteral * ast_zk_path, ASTLiteral * ast_replica_name)
+    {
+        /// Unfold {database} and {table} macro on table creation, so table can be renamed.
+        if (mode < LoadingStrictnessLevel::ATTACH)
+        {
+            Macros::MacroExpansionInfo info;
+            /// NOTE: it's not recursive
+            info.expand_special_macros_only = true;
+            info.table_id = table_id;
+            /// Avoid unfolding {uuid} macro on this step.
+            /// We did unfold it in previous versions to make moving table from Atomic to Ordinary database work correctly,
+            /// but now it's not allowed (and it was the only reason to unfold {uuid} macro).
+            info.table_id.uuid = UUIDHelpers::Nil;
+            zookeeper_path = context->getMacros()->expand(zookeeper_path, info);
+
+            info.level = 0;
+            replica_name = context->getMacros()->expand(replica_name, info);
+        }
+
+        ast_zk_path->value = zookeeper_path;
+        ast_replica_name->value = replica_name;
+
+        /// Expand other macros (such as {shard} and {replica}). We do not expand them on previous step
+        /// to make possible copying metadata files between replicas.
+        Macros::MacroExpansionInfo info;
+        info.table_id = table_id;
+        if (is_replicated_database)
+        {
+            auto database = DatabaseCatalog::instance().getDatabase(table_id.database_name);
+            info.shard = getReplicatedDatabaseShardName(database);
+            info.replica = getReplicatedDatabaseReplicaName(database);
+        }
+        if (!allow_uuid_macro)
+            info.table_id.uuid = UUIDHelpers::Nil;
+        zookeeper_path = context->getMacros()->expand(zookeeper_path, info);
+
+        info.level = 0;
+        info.table_id.uuid = UUIDHelpers::Nil;
+        replica_name = context->getMacros()->expand(replica_name, info);
+
+        /// We do not allow renaming table with these macros in metadata, because zookeeper_path will be broken after RENAME TABLE.
+        /// NOTE: it may happen if table was created by older version of ClickHouse (< 20.10) and macros was not unfolded on table creation
+        /// or if one of these macros is recursively expanded from some other macro.
+        /// Also do not allow to move table from Atomic to Ordinary database if there's {uuid} macro
+        if (info.expanded_database || info.expanded_table)
+            renaming_restrictions = RenamingRestrictions::DO_NOT_ALLOW;
+        else if (info.expanded_uuid)
+            renaming_restrictions = RenamingRestrictions::ALLOW_PRESERVING_UUID;
+    };
+
+    size_t arg_num = 0;
+    size_t arg_cnt = engine_args.size();
+
+    bool has_arguments = (arg_num + 2 <= arg_cnt);
+    bool has_valid_arguments = has_arguments && engine_args[arg_num]->as<ASTLiteral>() && engine_args[arg_num + 1]->as<ASTLiteral>();
+
+    if (has_valid_arguments)
+    {
+        /// Get path and name from engine arguments
+        auto * ast_zk_path = engine_args[arg_num]->as<ASTLiteral>();
+        if (ast_zk_path && ast_zk_path->value.getType() == Field::Types::String)
+            zookeeper_path = ast_zk_path->value.safeGet<String>();
+        else
+            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Path in ZooKeeper must be a string literal{}", verbose_help_message);
+
+        auto * ast_replica_name = engine_args[arg_num + 1]->as<ASTLiteral>();
+        if (ast_replica_name && ast_replica_name->value.getType() == Field::Types::String)
+            replica_name = ast_replica_name->value.safeGet<String>();
+        else
+            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Replica name must be a string literal{}", verbose_help_message);
+
+        if (replica_name.empty())
+            throw Exception(ErrorCodes::NO_REPLICA_NAME_GIVEN, "No replica name in config{}", verbose_help_message);
+
+        expand_macro(ast_zk_path, ast_replica_name);
+    }
+    else if (is_extended_storage_def
+        && (arg_cnt == 0
+            || !engine_args[arg_num]->as<ASTLiteral>()
+            || (arg_cnt == 1 && (getNamePart(engine_name) == "Graphite"))))
+    {
+        /// Try use default values if arguments are not specified.
+        /// Note: {uuid} macro works for ON CLUSTER queries when database engine is Atomic.
+        const auto & server_settings = context->getServerSettings();
+        zookeeper_path = server_settings.default_replica_path;
+        /// TODO maybe use hostname if {replica} is not defined?
+        replica_name = server_settings.default_replica_name;
+
+        /// Modify query, so default values will be written to metadata
+        assert(arg_num == 0);
+        ASTs old_args;
+        std::swap(engine_args, old_args);
+        auto path_arg = std::make_shared<ASTLiteral>(zookeeper_path);
+        auto name_arg = std::make_shared<ASTLiteral>(replica_name);
+        auto * ast_zk_path = path_arg.get();
+        auto * ast_replica_name = name_arg.get();
+
+        expand_macro(ast_zk_path, ast_replica_name);
+
+        engine_args.emplace_back(std::move(path_arg));
+        engine_args.emplace_back(std::move(name_arg));
+        std::move(std::begin(old_args), std::end(old_args), std::back_inserter(engine_args));
+    }
+    else
+        throw Exception(ErrorCodes::BAD_ARGUMENTS, "Expected two string literal arguments: zookeeper_path and replica_name");
+}
+
+/// Extracts a zookeeper path from a specified CREATE TABLE query. Returns std::nullopt if it fails.
+std::optional<String> extractZooKeeperPathFromReplicatedTableDef(const ASTCreateQuery & query, const ContextPtr & context)
+{
+    try
+    {
+        if (!query.storage || !query.storage->engine)
+            return {};
+
+        const String & engine_name = query.storage->engine->name;
+        if (!isReplicated(engine_name))
+            return {};
+
+        StorageID table_id{query.getDatabase(), query.getTable(), query.uuid};
+        ASTs engine_args;
+        if (query.storage->engine->arguments)
+            engine_args = query.storage->engine->arguments->children;
+        for (auto & engine_arg : engine_args)
+            engine_arg = engine_arg->clone();
+        LoadingStrictnessLevel mode = LoadingStrictnessLevel::CREATE;
+        String zookeeper_path;
+        String replica_name;
+        RenamingRestrictions renaming_restrictions;
+
+        extractZooKeeperPathAndReplicaNameFromEngineArgs(query, table_id, engine_name, engine_args, mode, context,
+                                                         zookeeper_path, replica_name, renaming_restrictions);
+
+        return zookeeper_path;
+    }
+    catch (...)
+    {
+        return {};
+    }
+}
 
 static StoragePtr create(const StorageFactory::Arguments & args)
 {
@@ -156,17 +399,12 @@ static StoragePtr create(const StorageFactory::Arguments & args)
      *  - Additional MergeTreeSettings in the SETTINGS clause;
      */
 
-    bool is_extended_storage_def = args.storage_def->isExtendedStorageDefinition()
-        || (args.query.columns_list->indices && !args.query.columns_list->indices->children.empty())
-        || (args.query.columns_list->projections && !args.query.columns_list->projections->children.empty());
+    bool is_extended_storage_def = isExtendedStorageDef(args.query);
 
     const Settings & local_settings = args.getLocalContext()->getSettingsRef();
 
-    String name_part = args.engine_name.substr(0, args.engine_name.size() - strlen("MergeTree"));
-
-    bool replicated = startsWith(name_part, "Replicated");
-    if (replicated)
-        name_part = name_part.substr(strlen("Replicated"));
+    bool replicated = isReplicated(args.engine_name);
+    std::string_view name_part = getNamePart(args.engine_name);
 
     MergeTreeData::MergingParams merging_params;
     merging_params.mode = MergeTreeData::MergingParams::Ordinary;
@@ -283,29 +521,7 @@ static StoragePtr create(const StorageFactory::Arguments & args)
     {
         /// Allow expressions in engine arguments.
         /// In new syntax argument can be literal or identifier or array/tuple of identifiers.
-        size_t arg_idx = 0;
-        try
-        {
-            for (; arg_idx < engine_args.size(); ++arg_idx)
-            {
-                auto & arg = engine_args[arg_idx];
-                auto * arg_func = arg->as<ASTFunction>();
-                if (!arg_func)
-                    continue;
-
-                /// If we got ASTFunction, let's evaluate it and replace with ASTLiteral.
-                /// Do not try evaluate array or tuple, because it's array or tuple of column identifiers.
-                if (arg_func->name == "array" || arg_func->name == "tuple")
-                    continue;
-                Field value = evaluateConstantExpression(arg, args.getLocalContext()).first;
-                arg = std::make_shared<ASTLiteral>(value);
-            }
-        }
-        catch (Exception & e)
-        {
-            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot evaluate engine argument {}: {} {}",
-                            arg_idx, e.message(), verbose_help_message);
-        }
+        evaluateEngineArgs(engine_args, args.getLocalContext());
     }
     else if (args.mode <= LoadingStrictnessLevel::CREATE && !local_settings.allow_deprecated_syntax_for_merge_tree)
     {
@@ -314,130 +530,17 @@ static StoragePtr create(const StorageFactory::Arguments & args)
                         "See also `allow_deprecated_syntax_for_merge_tree` setting.");
     }
 
-    /// For Replicated.
+    /// Extract zookeeper path and replica name from engine arguments.
     String zookeeper_path;
     String replica_name;
     RenamingRestrictions renaming_restrictions = RenamingRestrictions::ALLOW_ANY;
 
-    bool is_on_cluster = args.getLocalContext()->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY;
-    bool is_replicated_database = args.getLocalContext()->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY &&
-        DatabaseCatalog::instance().getDatabase(args.table_id.database_name)->getEngineName() == "Replicated";
-
-    /// Allow implicit {uuid} macros only for zookeeper_path in ON CLUSTER queries
-    /// and if UUID was explicitly passed in CREATE TABLE (like for ATTACH)
-    bool allow_uuid_macro = is_on_cluster || is_replicated_database || args.query.attach || args.query.has_uuid;
-
-    auto expand_macro = [&] (ASTLiteral * ast_zk_path, ASTLiteral * ast_replica_name)
-    {
-        /// Unfold {database} and {table} macro on table creation, so table can be renamed.
-        if (args.mode < LoadingStrictnessLevel::ATTACH)
-        {
-            Macros::MacroExpansionInfo info;
-            /// NOTE: it's not recursive
-            info.expand_special_macros_only = true;
-            info.table_id = args.table_id;
-            /// Avoid unfolding {uuid} macro on this step.
-            /// We did unfold it in previous versions to make moving table from Atomic to Ordinary database work correctly,
-            /// but now it's not allowed (and it was the only reason to unfold {uuid} macro).
-            info.table_id.uuid = UUIDHelpers::Nil;
-            zookeeper_path = context->getMacros()->expand(zookeeper_path, info);
-
-            info.level = 0;
-            replica_name = context->getMacros()->expand(replica_name, info);
-        }
-
-        ast_zk_path->value = zookeeper_path;
-        ast_replica_name->value = replica_name;
-
-        /// Expand other macros (such as {shard} and {replica}). We do not expand them on previous step
-        /// to make possible copying metadata files between replicas.
-        Macros::MacroExpansionInfo info;
-        info.table_id = args.table_id;
-        if (is_replicated_database)
-        {
-            auto database = DatabaseCatalog::instance().getDatabase(args.table_id.database_name);
-            info.shard = getReplicatedDatabaseShardName(database);
-            info.replica = getReplicatedDatabaseReplicaName(database);
-        }
-        if (!allow_uuid_macro)
-            info.table_id.uuid = UUIDHelpers::Nil;
-        zookeeper_path = context->getMacros()->expand(zookeeper_path, info);
-
-        info.level = 0;
-        info.table_id.uuid = UUIDHelpers::Nil;
-        replica_name = context->getMacros()->expand(replica_name, info);
-
-        /// We do not allow renaming table with these macros in metadata, because zookeeper_path will be broken after RENAME TABLE.
-        /// NOTE: it may happen if table was created by older version of ClickHouse (< 20.10) and macros was not unfolded on table creation
-        /// or if one of these macros is recursively expanded from some other macro.
-        /// Also do not allow to move table from Atomic to Ordinary database if there's {uuid} macro
-        if (info.expanded_database || info.expanded_table)
-            renaming_restrictions = RenamingRestrictions::DO_NOT_ALLOW;
-        else if (info.expanded_uuid)
-            renaming_restrictions = RenamingRestrictions::ALLOW_PRESERVING_UUID;
-    };
-
     if (replicated)
     {
-        bool has_arguments = arg_num + 2 <= arg_cnt;
-        bool has_valid_arguments = has_arguments && engine_args[arg_num]->as<ASTLiteral>() && engine_args[arg_num + 1]->as<ASTLiteral>();
-
-        ASTLiteral * ast_zk_path;
-        ASTLiteral * ast_replica_name;
-
-        if (has_valid_arguments)
-        {
-            /// Get path and name from engine arguments
-            ast_zk_path = engine_args[arg_num]->as<ASTLiteral>();
-            if (ast_zk_path && ast_zk_path->value.getType() == Field::Types::String)
-                zookeeper_path = ast_zk_path->value.safeGet<String>();
-            else
-                throw Exception(ErrorCodes::BAD_ARGUMENTS, "Path in ZooKeeper must be a string literal{}", verbose_help_message);
-            ++arg_num;
-
-            ast_replica_name = engine_args[arg_num]->as<ASTLiteral>();
-            if (ast_replica_name && ast_replica_name->value.getType() == Field::Types::String)
-                replica_name = ast_replica_name->value.safeGet<String>();
-            else
-                throw Exception(ErrorCodes::BAD_ARGUMENTS, "Replica name must be a string literal{}", verbose_help_message);
-
-            if (replica_name.empty())
-                throw Exception(ErrorCodes::NO_REPLICA_NAME_GIVEN, "No replica name in config{}", verbose_help_message);
-            ++arg_num;
-
-            expand_macro(ast_zk_path, ast_replica_name);
-        }
-        else if (is_extended_storage_def
-            && (arg_cnt == 0
-                || !engine_args[arg_num]->as<ASTLiteral>()
-                || (arg_cnt == 1 && merging_params.mode == MergeTreeData::MergingParams::Graphite)))
-        {
-            /// Try use default values if arguments are not specified.
-            /// Note: {uuid} macro works for ON CLUSTER queries when database engine is Atomic.
-            const auto & server_settings = args.getContext()->getServerSettings();
-            zookeeper_path = server_settings.default_replica_path;
-            /// TODO maybe use hostname if {replica} is not defined?
-            replica_name = server_settings.default_replica_name;
-
-            /// Modify query, so default values will be written to metadata
-            assert(arg_num == 0);
-            ASTs old_args;
-            std::swap(engine_args, old_args);
-            auto path_arg = std::make_shared<ASTLiteral>(zookeeper_path);
-            auto name_arg = std::make_shared<ASTLiteral>(replica_name);
-            ast_zk_path = path_arg.get();
-            ast_replica_name = name_arg.get();
-
-            expand_macro(ast_zk_path, ast_replica_name);
-
-            engine_args.emplace_back(std::move(path_arg));
-            engine_args.emplace_back(std::move(name_arg));
-            std::move(std::begin(old_args), std::end(old_args), std::back_inserter(engine_args));
-            arg_num = 2;
-            arg_cnt += 2;
-        }
-        else
-            throw Exception(ErrorCodes::BAD_ARGUMENTS, "Expected two string literal arguments: zookeeper_path and replica_name");
+        extractZooKeeperPathAndReplicaNameFromEngineArgs(args.query, args.table_id, args.engine_name, args.engine_args, args.mode,
+                                                         args.getLocalContext(), zookeeper_path, replica_name, renaming_restrictions);
+        arg_cnt = engine_args.size(); /// Update `arg_cnt` here because extractZooKeeperPathAndReplicaNameFromEngineArgs() could add arguments.
+        arg_num = 2; /// zookeeper_path and replica_name together are always two arguments.
     }
 
     /// This merging param maybe used as part of sorting key
diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp
index 58d1846915f..0639b172d31 100644
--- a/src/Storages/StorageReplicatedMergeTree.cpp
+++ b/src/Storages/StorageReplicatedMergeTree.cpp
@@ -31,7 +31,6 @@
 #include
 #include
 #include
-#include <Storages/MergeTree/extractZkPathFromCreateQuery.h>
 #include
 #include
 #include
 
From faae8a4f2b683eed530b74f92ab58d1a76b5d001 Mon Sep 17 00:00:00 2001
From: Vitaly Baranov
Date: Wed, 24 Apr 2024 20:37:06 +0200
Subject: [PATCH 065/289] Add tests for backup on cluster with 2 shards and 2 replicas.
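
The test matrix covers a cluster of two shards with two replicas each, backed
up and restored as a whole. The interesting corner case is two tables whose
ZooKeeper paths both use the {uuid} macro: keying the backup coordination by
the full ZooKeeper path (see the previous commits) keeps them distinct. A
rough sketch of the property being exercised (illustrative C++, not part of
the test code; `uuid_a` and `uuid_b` stand for the UUIDs the tables get on
creation):

    // Two tables created from the same '/clickhouse/tables/{uuid}/{shard}'
    // pattern expand to different coordination keys, so their parts and
    // mutations can no longer be mixed up during a backup.
    String key_a = "/clickhouse/tables/" + toString(uuid_a) + "/1";  // table_a, shard 1
    String key_b = "/clickhouse/tables/" + toString(uuid_b) + "/1";  // table_b, shard 1
    chassert(key_a != key_b);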
---
 .../configs/cluster_2x2.xml                   |  26 +++
 .../test_backup_restore_on_cluster/test.py    |   1 -
 .../test_two_shards_two_replicas.py           | 153 ++++++++++++++++++
 3 files changed, 179 insertions(+), 1 deletion(-)
 create mode 100644 tests/integration/test_backup_restore_on_cluster/configs/cluster_2x2.xml
 create mode 100644 tests/integration/test_backup_restore_on_cluster/test_two_shards_two_replicas.py

diff --git a/tests/integration/test_backup_restore_on_cluster/configs/cluster_2x2.xml b/tests/integration/test_backup_restore_on_cluster/configs/cluster_2x2.xml
new file mode 100644
index 00000000000..97e60fbbed7
--- /dev/null
+++ b/tests/integration/test_backup_restore_on_cluster/configs/cluster_2x2.xml
@@ -0,0 +1,26 @@
+<clickhouse>
+    <remote_servers>
+        <cluster_2x2>
+            <shard>
+                <replica>
+                    <host>node_1_1</host>
+                    <port>9000</port>
+                </replica>
+                <replica>
+                    <host>node_1_2</host>
+                    <port>9000</port>
+                </replica>
+            </shard>
+            <shard>
+                <replica>
+                    <host>node_2_1</host>
+                    <port>9000</port>
+                </replica>
+                <replica>
+                    <host>node_2_2</host>
+                    <port>9000</port>
+                </replica>
+            </shard>
+        </cluster_2x2>
+    </remote_servers>
+</clickhouse>
diff --git a/tests/integration/test_backup_restore_on_cluster/test.py b/tests/integration/test_backup_restore_on_cluster/test.py
index d1520444df1..700ed6f15f5 100644
--- a/tests/integration/test_backup_restore_on_cluster/test.py
+++ b/tests/integration/test_backup_restore_on_cluster/test.py
@@ -41,7 +41,6 @@ node2 = cluster.add_instance(
     stay_alive=True,  # Necessary for the "test_stop_other_host_while_backup" test
 )
-
 node3 = cluster.add_instance(
     "node3",
     main_configs=main_configs,
diff --git a/tests/integration/test_backup_restore_on_cluster/test_two_shards_two_replicas.py b/tests/integration/test_backup_restore_on_cluster/test_two_shards_two_replicas.py
new file mode 100644
index 00000000000..c0e318c8bb7
--- /dev/null
+++ b/tests/integration/test_backup_restore_on_cluster/test_two_shards_two_replicas.py
@@ -0,0 +1,153 @@
+import pytest
+from helpers.cluster import ClickHouseCluster
+from helpers.test_tools import TSV
+
+
+cluster = ClickHouseCluster(__file__)
+
+main_configs = [
+    "configs/backups_disk.xml",
+    "configs/cluster_2x2.xml",
+    "configs/lesser_timeouts.xml",  # Default timeouts are quite big (a few minutes), the tests don't need them to be that big.
+]
+
+user_configs = [
+    "configs/zookeeper_retries.xml",
+]
+
+node_1_1 = cluster.add_instance(
+    "node_1_1",
+    main_configs=main_configs,
+    user_configs=user_configs,
+    external_dirs=["/backups/"],
+    macros={"replica": "1", "shard": "1"},
+    with_zookeeper=True,
+)
+
+node_1_2 = cluster.add_instance(
+    "node_1_2",
+    main_configs=main_configs,
+    user_configs=user_configs,
+    external_dirs=["/backups/"],
+    macros={"replica": "2", "shard": "1"},
+    with_zookeeper=True,
+)
+
+node_2_1 = cluster.add_instance(
+    "node_2_1",
+    main_configs=main_configs,
+    user_configs=user_configs,
+    external_dirs=["/backups/"],
+    macros={"replica": "1", "shard": "2"},
+    with_zookeeper=True,
+)
+
+node_2_2 = cluster.add_instance(
+    "node_2_2",
+    main_configs=main_configs,
+    user_configs=user_configs,
+    external_dirs=["/backups/"],
+    macros={"replica": "2", "shard": "2"},
+    with_zookeeper=True,
+)
+
+
+@pytest.fixture(scope="module", autouse=True)
+def start_cluster():
+    try:
+        cluster.start()
+        yield cluster
+    finally:
+        cluster.shutdown()
+
+
+@pytest.fixture(autouse=True)
+def drop_after_test():
+    try:
+        yield
+    finally:
+        node_1_1.query("DROP TABLE IF EXISTS tbl ON CLUSTER 'cluster_2x2' SYNC")
+        node_1_1.query("DROP TABLE IF EXISTS table_a ON CLUSTER 'cluster_2x2' SYNC")
+        node_1_1.query("DROP TABLE IF EXISTS table_b ON CLUSTER 'cluster_2x2' SYNC")
+
+
+backup_id_counter = 0
+
+
+def new_backup_name():
+    global backup_id_counter
+    backup_id_counter += 1
+    return f"Disk('backups', '{backup_id_counter}')"
+
+
+def test_replicated_table():
+    node_1_1.query(
+        "CREATE TABLE tbl ON CLUSTER 'cluster_2x2' ("
+        "x Int64"
+        ") ENGINE=ReplicatedMergeTree('/clickhouse/tables/tbl/{shard}', '{replica}')"
+        "ORDER BY x"
+    )
+
+    node_1_1.query("INSERT INTO tbl VALUES (100), (200)")
+    node_2_1.query("INSERT INTO tbl VALUES (300), (400)")
+
+    backup_name = new_backup_name()
+
+    node_1_1.query(f"BACKUP TABLE tbl ON CLUSTER 'cluster_2x2' TO {backup_name}")
+
+    node_1_1.query(f"DROP TABLE tbl ON CLUSTER 'cluster_2x2' SYNC")
+
+    node_1_1.query(f"RESTORE ALL ON CLUSTER 'cluster_2x2' FROM {backup_name}")
+
+    node_1_1.query("SYSTEM SYNC REPLICA ON CLUSTER 'cluster_2x2' tbl")
+
+    assert node_1_1.query("SELECT * FROM tbl ORDER BY x") == TSV([[100], [200]])
+    assert node_1_2.query("SELECT * FROM tbl ORDER BY x") == TSV([[100], [200]])
+    assert node_2_1.query("SELECT * FROM tbl ORDER BY x") == TSV([[300], [400]])
+    assert node_2_2.query("SELECT * FROM tbl ORDER BY x") == TSV([[300], [400]])
+
+
+def test_two_tables_with_uuid_in_zk_path():
+    node_1_1.query(
+        "CREATE TABLE table_a ON CLUSTER 'cluster_2x2' ("
+        "x Int64"
+        ") ENGINE=ReplicatedMergeTree('/clickhouse/tables/{uuid}/{shard}', '{replica}')"
+        "ORDER BY x"
+    )
+
+    node_1_1.query(
+        "CREATE TABLE table_b ON CLUSTER 'cluster_2x2' ("
+        "x Int64"
+        ") ENGINE=ReplicatedMergeTree('/clickhouse/tables/{uuid}/{shard}', '{replica}')"
+        "ORDER BY x"
+    )
+
+    node_1_1.query("INSERT INTO table_a VALUES (100), (200)")
+    node_2_1.query("INSERT INTO table_a VALUES (300), (400)")
+
+    node_1_2.query("INSERT INTO table_b VALUES (500), (600)")
+    node_2_2.query("INSERT INTO table_b VALUES (700), (800)")
+
+    backup_name = new_backup_name()
+
+    node_1_1.query(
+        f"BACKUP TABLE table_a, TABLE table_b ON CLUSTER 'cluster_2x2' TO {backup_name}"
+    )
+
+    node_1_1.query(f"DROP TABLE table_a ON CLUSTER 'cluster_2x2' SYNC")
+    node_1_1.query(f"DROP TABLE table_b ON CLUSTER 'cluster_2x2' SYNC")
+
+    node_1_1.query(f"RESTORE ALL ON CLUSTER 'cluster_2x2' FROM {backup_name}")
+
ON CLUSTER 'cluster_2x2' table_a") + node_1_1.query("SYSTEM SYNC REPLICA ON CLUSTER 'cluster_2x2' table_b") + + assert node_1_1.query("SELECT * FROM table_a ORDER BY x") == TSV([[100], [200]]) + assert node_1_2.query("SELECT * FROM table_a ORDER BY x") == TSV([[100], [200]]) + assert node_2_1.query("SELECT * FROM table_a ORDER BY x") == TSV([[300], [400]]) + assert node_2_2.query("SELECT * FROM table_a ORDER BY x") == TSV([[300], [400]]) + + assert node_1_1.query("SELECT * FROM table_b ORDER BY x") == TSV([[500], [600]]) + assert node_1_2.query("SELECT * FROM table_b ORDER BY x") == TSV([[500], [600]]) + assert node_2_1.query("SELECT * FROM table_b ORDER BY x") == TSV([[700], [800]]) + assert node_2_2.query("SELECT * FROM table_b ORDER BY x") == TSV([[700], [800]]) From bff72f3b2753e88aaa1b703258ad904ad11fc4ee Mon Sep 17 00:00:00 2001 From: skyoct Date: Fri, 26 Apr 2024 09:06:17 +0000 Subject: [PATCH 066/289] batter --- src/Functions/clamp.cpp | 2 +- tests/queries/0_stateless/03036_clamp.sql | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp index 3438377afbf..448711aed27 100644 --- a/src/Functions/clamp.cpp +++ b/src/Functions/clamp.cpp @@ -47,7 +47,7 @@ public: for (size_t row_num = 0; row_num < input_rows_count; ++row_num) { if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[2], 1) > 0) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Function {} the minimum value cannot be greater than the maximum value", getName()); + throw Exception(ErrorCodes::BAD_ARGUMENTS, "The minimum value cannot be greater than the maximum value for function {}", getName()); size_t best_arg = 0; if (converted_columns[1]->compareAt(row_num, row_num, *converted_columns[best_arg], 1) > 0) diff --git a/tests/queries/0_stateless/03036_clamp.sql b/tests/queries/0_stateless/03036_clamp.sql index d225be63f46..0ca1f99572a 100644 --- a/tests/queries/0_stateless/03036_clamp.sql +++ b/tests/queries/0_stateless/03036_clamp.sql @@ -10,6 +10,6 @@ select clamp(1, null, 5); select clamp(1, 6, null); select clamp(1, 5, nan); select clamp(toInt64(number), toInt64(number-1), toInt64(number+1)) from numbers(3); -select clamp(number, number-1, number+1) from numbers(3); -- { serverError 386 } -select clamp(1, 3, 2); -- { serverError 36 } +select clamp(number, number-1, number+1) from numbers(3); -- { serverError NO_COMMON_TYPE } +select clamp(1, 3, 2); -- { serverError BAD_ARGUMENTS } select clamp(1, data[1], data[2])from (select arrayJoin([[1, 2], [2,3], [3,2], [4, 4]]) as data); -- { serverError 36 } From fb375e7a74826a6741df24999936147606ea9c8d Mon Sep 17 00:00:00 2001 From: Antonio Andelic Date: Mon, 29 Apr 2024 14:59:31 +0200 Subject: [PATCH 067/289] Apply suggestions from code review --- src/Functions/clamp.cpp | 3 +-- tests/queries/0_stateless/03036_clamp.sql | 2 +- 2 files changed, 2 insertions(+), 3 deletions(-) diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp index 448711aed27..bb347a575e4 100644 --- a/src/Functions/clamp.cpp +++ b/src/Functions/clamp.cpp @@ -22,8 +22,7 @@ public: static constexpr auto name = "clamp"; String getName() const override { return name; } - size_t getNumberOfArguments() const override { return 0; } - bool isVariadic() const override { return true; } + size_t getNumberOfArguments() const override { return 3; } bool useDefaultImplementationForConstants() const override { return true; } bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { 
From fb375e7a74826a6741df24999936147606ea9c8d Mon Sep 17 00:00:00 2001
From: Antonio Andelic
Date: Mon, 29 Apr 2024 14:59:31 +0200
Subject: [PATCH 067/289] Apply suggestions from code review

---
 src/Functions/clamp.cpp                   | 3 +--
 tests/queries/0_stateless/03036_clamp.sql | 2 +-
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/src/Functions/clamp.cpp b/src/Functions/clamp.cpp
index 448711aed27..bb347a575e4 100644
--- a/src/Functions/clamp.cpp
+++ b/src/Functions/clamp.cpp
@@ -22,8 +22,7 @@ public:
     static constexpr auto name = "clamp";
     String getName() const override { return name; }
-    size_t getNumberOfArguments() const override { return 0; }
-    bool isVariadic() const override { return true; }
+    size_t getNumberOfArguments() const override { return 3; }
     bool useDefaultImplementationForConstants() const override { return true; }
     bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return false; }
     static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionClamp>(); }

diff --git a/tests/queries/0_stateless/03036_clamp.sql b/tests/queries/0_stateless/03036_clamp.sql
index 0ca1f99572a..9973265c13b 100644
--- a/tests/queries/0_stateless/03036_clamp.sql
+++ b/tests/queries/0_stateless/03036_clamp.sql
@@ -12,4 +12,4 @@ select clamp(1, 5, nan);
 select clamp(toInt64(number), toInt64(number-1), toInt64(number+1)) from numbers(3);
 select clamp(number, number-1, number+1) from numbers(3); -- { serverError NO_COMMON_TYPE }
 select clamp(1, 3, 2); -- { serverError BAD_ARGUMENTS }
-select clamp(1, data[1], data[2])from (select arrayJoin([[1, 2], [2,3], [3,2], [4, 4]]) as data); -- { serverError 36 }
+select clamp(1, data[1], data[2])from (select arrayJoin([[1, 2], [2,3], [3,2], [4, 4]]) as data); -- { serverError BAD_ARGUMENTS }

From 155866b262e9cd3123b23522ea8bda301b514233 Mon Sep 17 00:00:00 2001
From: Max Kainov
Date: Mon, 29 Apr 2024 13:47:08 +0000
Subject: [PATCH 068/289] CI: try separate wf file for MQ

---
 .github/workflows/merge_queue.yml  | 97 ++++++++++++++++++++++++++++++
 .github/workflows/pull_request.yml | 33 +++++-----
 2 files changed, 113 insertions(+), 17 deletions(-)
 create mode 100644 .github/workflows/merge_queue.yml

diff --git a/.github/workflows/merge_queue.yml b/.github/workflows/merge_queue.yml
new file mode 100644
index 00000000000..2b820926651
--- /dev/null
+++ b/.github/workflows/merge_queue.yml
@@ -0,0 +1,97 @@
+# yamllint disable rule:comments-indentation
+name: MergeQueueCI
+
+env:
+  # Force the stdout and stderr streams to be unbuffered
+  PYTHONUNBUFFERED: 1
+
+on: # yamllint disable-line rule:truthy
+  merge_group:
+
+jobs:
+  RunConfig:
+    runs-on: [self-hosted, style-checker-aarch64]
+    outputs:
+      data: ${{ steps.runconfig.outputs.CI_DATA }}
+    steps:
+      - name: GH event json
+        run: |
+          cat "$GITHUB_EVENT_PATH" ||:
+      - name: Check out repository code
+        uses: ClickHouse/checkout@v1
+        with:
+          clear-repository: true # to ensure correct digests
+          fetch-depth: 0 # to get version
+          filter: tree:0
+      - name: Python unit tests
+        run: |
+          cd "$GITHUB_WORKSPACE/tests/ci"
+          echo "Testing the main ci directory"
+          python3 -m unittest discover -s . -p 'test_*.py'
+          for dir in *_lambda/; do
+            echo "Testing $dir"
+            python3 -m unittest discover -s "$dir" -p 'test_*.py'
+          done
+      - name: PrepareRunConfig
+        id: runconfig
+        run: |
+          python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --configure --outfile ${{ runner.temp }}/ci_run_data.json
+
+          echo "::group::CI configuration"
+          python3 -m json.tool ${{ runner.temp }}/ci_run_data.json
+          echo "::endgroup::"
+
+          {
+            echo 'CI_DATA<<EOF'
+            cat ${{ runner.temp }}/ci_run_data.json
+            echo 'EOF'
+          } >> "$GITHUB_OUTPUT"
+  BuildDockers:
+    needs: [RunConfig]
+    if: ${{ !failure() && !cancelled() && toJson(fromJson(needs.RunConfig.outputs.data).docker_data.missing_multi) != '[]' }}
+    uses: ./.github/workflows/reusable_docker.yml
+    with:
+      data: ${{ needs.RunConfig.outputs.data }}
+  StyleCheck:
+    needs: [RunConfig, BuildDockers]
+    if: ${{ !failure() && !cancelled() && contains(fromJson(needs.RunConfig.outputs.data).jobs_data.jobs_to_do, 'Style check')}}
+    uses: ./.github/workflows/reusable_test.yml
+    with:
+      test_name: Style check
+      runner_type: style-checker
+      run_command: |
+        python3 style_check.py
+      data: ${{ needs.RunConfig.outputs.data }}
+    secrets:
+      secret_envs: |
+        ROBOT_CLICKHOUSE_SSH_KEY<<RCSK
+        ${{secrets.ROBOT_CLICKHOUSE_SSH_KEY}}
+        RCSK

diff --git a/.github/workflows/pull_request.yml b/.github/workflows/pull_request.yml
--- a/.github/workflows/pull_request.yml
+++ b/.github/workflows/pull_request.yml
@@ ... @@
         } >> "$GITHUB_OUTPUT"
       - name: Re-create GH statuses for skipped jobs if any
-        if: ${{ github.event_name != 'merge_group' }}
         run: |
           python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ runner.temp }}/ci_run_data.json --update-gh-statuses
   BuildDockers:
@@ -83,7 +86,7 @@ jobs:
         ${{secrets.ROBOT_CLICKHOUSE_SSH_KEY}}
         RCSK
   FastTest:
-    needs: [RunConfig, BuildDockers]
+    needs: [RunConfig, BuildDockers, StyleCheck]
     if: ${{ !failure() && !cancelled() && contains(fromJson(needs.RunConfig.outputs.data).jobs_data.jobs_to_do, 'Fast test') }}
    uses: ./.github/workflows/reusable_test.yml
    with:
@@ -163,20 +166,16 @@ jobs:
     steps:
       - name: Check out repository code
         uses: ClickHouse/checkout@v1
-      - name: Check sync status
-        if: ${{ github.event_name == 'merge_group' }}
-        run: |
-          cd "$GITHUB_WORKSPACE/tests/ci"
-          python3 sync_pr.py --status
       - name: Finish label
         run: |
           cd "$GITHUB_WORKSPACE/tests/ci"
-          python3 finish_check.py ${{ (contains(needs.*.result, 'failure') && github.event_name == 'merge_group') && '--pipeline-failure' || '' }}
-      - name: Auto merge if approved
-        if: ${{ github.event_name != 'merge_group' }}
-        run: |
-          cd "$GITHUB_WORKSPACE/tests/ci"
-          python3 merge_pr.py --check-approved
+          python3 finish_check.py
+      # FIXME: merge on approval does not work with MQ. Could be fixed by using default GH's automerge after some corrections in Mergeable Check status
+      # - name: Auto merge if approved
+      #   if: ${{ github.event_name != 'merge_group' }}
+      #   run: |
+      #     cd "$GITHUB_WORKSPACE/tests/ci"
+      #     python3 merge_pr.py --check-approved
 #############################################################################################

From 8f93df354ec51a6c8393cdeae67016dbb89aa217 Mon Sep 17 00:00:00 2001
From: HowePa <2873679104@qq.com>
Date: Tue, 30 Apr 2024 20:34:08 +0800
Subject: [PATCH 069/289] fix end symbol

---
 src/Processors/Formats/Impl/NpyOutputFormat.cpp              | 6 +++++-
 tests/queries/0_stateless/02895_npy_output_format.reference | 6 +++---
 2 files changed, 8 insertions(+), 4 deletions(-)

diff --git a/src/Processors/Formats/Impl/NpyOutputFormat.cpp b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
index b3d5042aa79..e02787b4f70 100644
--- a/src/Processors/Formats/Impl/NpyOutputFormat.cpp
+++ b/src/Processors/Formats/Impl/NpyOutputFormat.cpp
@@ -40,7 +40,11 @@ void writeNumpyStrings(const ColumnPtr & column, size_t length, WriteBuffer & buf)
 {
     const auto * string_column = assert_cast<const ColumnString *>(column.get());
     for (size_t i = 0; i < string_column->size(); ++i)
-        buf.write(string_column->getDataAt(i).data, length);
+    {
+        auto data = string_column->getDataAt(i);
+        buf.write(data.data, data.size);
+        writeChar(0, length - data.size, buf);
+    }
 }

 }

diff --git a/tests/queries/0_stateless/02895_npy_output_format.reference b/tests/queries/0_stateless/02895_npy_output_format.reference
index b599f1dceea..77d9b55ca9f 100644
--- a/tests/queries/0_stateless/02895_npy_output_format.reference
+++ b/tests/queries/0_stateless/02895_npy_output_format.reference
@@ -52,9 +52,9 @@ array String
 [[0.1],[0.2]]
 [[0.1],[0.2]]
 [[0.1],[0.2]]
-[['abb','bbc'],['ccc','dddd']]
-[['abb','bbc'],['ccc','dddd']]
-[['abb','bbc'],['ccc','dddd']]
+[['a','bb'],['ccc','dddd']]
+[['a','bb'],['ccc','dddd']]
+[['a','bb'],['ccc','dddd']]
 array Array(Array(Array(Int8)))
 array Array(Array(Float64))
 array Array(Array(String))

From 8de80954809435e15aa65ab29fba59230bc1eae5 Mon Sep 17 00:00:00 2001
From: Blargian
Date: Thu, 2 May 2024 11:56:14 +0200
Subject: [PATCH 070/289] Update addXYZ documentation

---
 .../functions/date-time-functions.md          | 468 +++++++++++++++++-
 .../aspell-ignore/en/aspell-dict.txt          |   2 +
 2 files changed, 465 insertions(+), 5 deletions(-)

diff --git a/docs/en/sql-reference/functions/date-time-functions.md b/docs/en/sql-reference/functions/date-time-functions.md
index 51f841657d9..629b3ca9305 100644
--- a/docs/en/sql-reference/functions/date-time-functions.md
+++ b/docs/en/sql-reference/functions/date-time-functions.md
@@ -2557,13 +2557,27 @@ Like function `YYYYMMDDhhmmssToDate()` but produces a [DateTime64](../../sql-ref
 
 Accepts an additional, optional `precision` parameter after the `timezone` parameter.
 
-## addYears, addQuarters, addMonths, addWeeks, addDays, addHours, addMinutes, addSeconds, addMilliseconds, addMicroseconds, addNanoseconds
+## addYears
 
-These functions add units of the interval specified by the function name to a date, a date with time or a string-encoded date / date with time. A date or date with time is returned.
+Adds a specified number of years to a date, a date with time or a string-encoded date / date with time.
 
-Example:
+**Syntax**
 
-``` sql
+```sql
+addYears(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of years to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of years to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` years. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
 WITH
     toDate('2024-01-01') AS date,
     toDateTime('2024-01-01 00:00:00') AS date_time,
     '2024-01-01 00:00:00' AS date_time_string
 SELECT
+    addYears(date, 1) AS add_years_with_date,
+    addYears(date_time, 1) AS add_years_with_date_time,
+    addYears(date_time_string, 1) AS add_years_with_date_time_string
 ```
 
-``` text
+```response
 ┌─add_years_with_date─┬─add_years_with_date_time─┬─add_years_with_date_time_string─┐
 │          2025-01-01 │      2025-01-01 00:00:00 │         2025-01-01 00:00:00.000 │
 └─────────────────────┴──────────────────────────┴─────────────────────────────────┘
 ```
 
+## addQuarters
+
+Adds a specified number of quarters to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addQuarters(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of quarters to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of quarters to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` quarters. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addQuarters(date, 1) AS add_quarters_with_date,
+    addQuarters(date_time, 1) AS add_quarters_with_date_time,
+    addQuarters(date_time_string, 1) AS add_quarters_with_date_time_string
+```
+
+```response
+┌─add_quarters_with_date─┬─add_quarters_with_date_time─┬─add_quarters_with_date_time_string─┐
+│             2024-04-01 │         2024-04-01 00:00:00 │            2024-04-01 00:00:00.000 │
+└────────────────────────┴─────────────────────────────┴────────────────────────────────────┘
+```
+
+## addMonths
+
+Adds a specified number of months to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addMonths(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of months to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of months to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` months. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addMonths(date, 6) AS add_months_with_date,
+    addMonths(date_time, 6) AS add_months_with_date_time,
+    addMonths(date_time_string, 6) AS add_months_with_date_time_string
+```
+
+```response
+┌─add_months_with_date─┬─add_months_with_date_time─┬─add_months_with_date_time_string─┐
+│           2024-07-01 │       2024-07-01 00:00:00 │          2024-07-01 00:00:00.000 │
+└──────────────────────┴───────────────────────────┴──────────────────────────────────┘
+```
+
+## addWeeks
+
+Adds a specified number of weeks to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addWeeks(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of weeks to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of weeks to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` weeks. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addWeeks(date, 5) AS add_weeks_with_date,
+    addWeeks(date_time, 5) AS add_weeks_with_date_time,
+    addWeeks(date_time_string, 5) AS add_weeks_with_date_time_string
+```
+
+```response
+┌─add_weeks_with_date─┬─add_weeks_with_date_time─┬─add_weeks_with_date_time_string─┐
+│          2024-02-05 │      2024-02-05 00:00:00 │         2024-02-05 00:00:00.000 │
+└─────────────────────┴──────────────────────────┴─────────────────────────────────┘
+```
+
+## addDays
+
+Adds a specified number of days to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addDays(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of days to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of days to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` days. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addDays(date, 5) AS add_days_with_date,
+    addDays(date_time, 5) AS add_days_with_date_time,
+    addDays(date_time_string, 5) AS add_days_with_date_time_string
+```
+
+```response
+┌─add_days_with_date─┬─add_days_with_date_time─┬─add_days_with_date_time_string─┐
+│         2024-01-06 │     2024-01-06 00:00:00 │        2024-01-06 00:00:00.000 │
+└────────────────────┴─────────────────────────┴────────────────────────────────┘
+```
+
+## addHours
+
+Adds a specified number of hours to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addHours(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of hours to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of hours to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` hours. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addHours(date, 12) AS add_hours_with_date,
+    addHours(date_time, 12) AS add_hours_with_date_time,
+    addHours(date_time_string, 12) AS add_hours_with_date_time_string
+```
+
+```response
+┌─add_hours_with_date─┬─add_hours_with_date_time─┬─add_hours_with_date_time_string─┐
+│ 2024-01-01 12:00:00 │      2024-01-01 12:00:00 │         2024-01-01 12:00:00.000 │
+└─────────────────────┴──────────────────────────┴─────────────────────────────────┘
+```
+
+## addMinutes
+
+Adds a specified number of minutes to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addMinutes(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of minutes to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of minutes to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` minutes. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addMinutes(date, 20) AS add_minutes_with_date,
+    addMinutes(date_time, 20) AS add_minutes_with_date_time,
+    addMinutes(date_time_string, 20) AS add_minutes_with_date_time_string
+```
+
+```response
+┌─add_minutes_with_date─┬─add_minutes_with_date_time─┬─add_minutes_with_date_time_string─┐
+│   2024-01-01 00:20:00 │        2024-01-01 00:20:00 │           2024-01-01 00:20:00.000 │
+└───────────────────────┴────────────────────────────┴───────────────────────────────────┘
+```
+
+## addSeconds
+
+Adds a specified number of seconds to a date, a date with time or a string-encoded date / date with time.
+
+**Syntax**
+
+```sql
+addSeconds(date, x)
+```
+
+**Parameters**
+
+- `date`: Date / date with time to add specified number of seconds to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of seconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date` plus `x` seconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDate('2024-01-01') AS date,
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addSeconds(date, 30) AS add_seconds_with_date,
+    addSeconds(date_time, 30) AS add_seconds_with_date_time,
+    addSeconds(date_time_string, 30) AS add_seconds_with_date_time_string
+```
+
+```response
+┌─add_seconds_with_date─┬─add_seconds_with_date_time─┬─add_seconds_with_date_time_string─┐
+│   2024-01-01 00:00:30 │        2024-01-01 00:00:30 │           2024-01-01 00:00:30.000 │
+└───────────────────────┴────────────────────────────┴───────────────────────────────────┘
+```
+
+## addMilliseconds
+
+Adds a specified number of milliseconds to a date with time or a string-encoded date with time.
+
+**Syntax**
+
+```sql
+addMilliseconds(date_time, x)
+```
+
+**Parameters**
+
+- `date_time`: Date with time to add specified number of milliseconds to. [datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of milliseconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date_time` plus `x` milliseconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addMilliseconds(date_time, 1000) AS add_milliseconds_with_date_time,
+    addMilliseconds(date_time_string, 1000) AS add_milliseconds_with_date_time_string
+```
+
+```response
+┌─add_milliseconds_with_date_time─┬─add_milliseconds_with_date_time_string─┐
+│         2024-01-01 00:00:01.000 │                 2024-01-01 00:00:01.000 │
+└─────────────────────────────────┴────────────────────────────────────────┘
+```
+
+## addMicroseconds
+
+Adds a specified number of microseconds to a date with time or a string-encoded date with time.
+
+**Syntax**
+
+```sql
+addMicroseconds(date_time, x)
+```
+
+**Parameters**
+
+- `date_time`: Date with time to add specified number of microseconds to. [datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of microseconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date_time` plus `x` microseconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addMicroseconds(date_time, 1000000) AS add_microseconds_with_date_time,
+    addMicroseconds(date_time_string, 1000000) AS add_microseconds_with_date_time_string
+```
+
+```response
+┌─add_microseconds_with_date_time─┬─add_microseconds_with_date_time_string─┐
+│      2024-01-01 00:00:01.000000 │              2024-01-01 00:00:01.000000 │
+└─────────────────────────────────┴────────────────────────────────────────┘
+```
+
+## addNanoseconds
+
+Adds a specified number of nanoseconds to a date with time or a string-encoded date with time.
+
+**Syntax**
+
+```sql
+addNanoseconds(date_time, x)
+```
+
+**Parameters**
+
+- `date_time`: Date with time to add specified number of nanoseconds to. [datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `x`: Number of nanoseconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md).
+
+**Returned value**
+- Returns `date_time` plus `x` nanoseconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+```sql
+WITH
+    toDateTime('2024-01-01 00:00:00') AS date_time,
+    '2024-01-01 00:00:00' AS date_time_string
+SELECT
+    addNanoseconds(date_time, 1000) AS add_nanoseconds_with_date_time,
+    addNanoseconds(date_time_string, 1000) AS add_nanoseconds_with_date_time_string
+```
+
+```response
+┌─add_nanoseconds_with_date_time─┬─add_nanoseconds_with_date_time_string─┐
+│  2024-01-01 00:00:00.000001000 │          2024-01-01 00:00:00.000001000 │
+└────────────────────────────────┴───────────────────────────────────────┘
+```
+
+## addInterval
+
+Adds an interval to another interval or tuple of intervals.
+
+**Syntax**
+
+```sql
+addInterval(interval_1, interval_2)
+```
+
+**Parameters**
+
+- `interval_1`: First interval or tuple of intervals. [interval](../data-types/special-data-types/interval.md), [tuple](../data-types/tuple.md)([interval](../data-types/special-data-types/interval.md)).
+- `interval_2`: Second interval to be added. [interval](../data-types/special-data-types/interval.md).
+
+**Returned value**
+- Returns a tuple of intervals. [tuple](../data-types/tuple.md)([interval](../data-types/special-data-types/interval.md)).
+
+:::note
+If the types of the first interval (or the interval in the tuple) and the second interval are the same, they will be merged into one interval.
+:::
+
+**Example**
+
+Query:
+
+```sql
+SELECT addInterval(INTERVAL 1 DAY, INTERVAL 1 MONTH);
+SELECT addInterval((INTERVAL 1 DAY, INTERVAL 1 YEAR), INTERVAL 1 MONTH);
+SELECT addInterval(INTERVAL 2 DAY, INTERVAL 1 DAY);
+```
+
+Result:
+
+```response
+┌─addInterval(toIntervalDay(1), toIntervalMonth(1))─┐
+│ (1,1)                                             │
+└───────────────────────────────────────────────────┘
+┌─addInterval((toIntervalDay(1), toIntervalYear(1)), toIntervalMonth(1))─┐
+│ (1,1,1)                                                                │
+└────────────────────────────────────────────────────────────────────────┘
+┌─addInterval(toIntervalDay(2), toIntervalDay(1))─┐
+│ (3)                                             │
+└─────────────────────────────────────────────────┘
+```
+
+## addTupleOfIntervals
+
+Consecutively adds a tuple of intervals to a Date or a DateTime.
+
+**Syntax**
+
+```sql
+addTupleOfIntervals(date, intervals)
+```
+
+**Parameters**
+
+- `date`: Date or date with time to add `intervals` to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+- `intervals`: Tuple of intervals to add to `date`. [tuple](../data-types/tuple.md)([interval](../data-types/special-data-types/interval.md)).
+
+**Returned value**
+- Returns `date` with added `intervals`. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+
+**Example**
+
+Query:
+
+```sql
+WITH toDate('2018-01-01') AS date SELECT addTupleOfIntervals(date, (INTERVAL 1 DAY, INTERVAL 1 MONTH, INTERVAL 1 YEAR))
+```
+
+Result:
+
+```response
+┌─addTupleOfIntervals(date, (toIntervalDay(1), toIntervalMonth(1), toIntervalYear(1)))─┐
+│                                                                            2019-02-02 │
+└──────────────────────────────────────────────────────────────────────────────────────┘
+```
+
 ## subtractYears, subtractQuarters, subtractMonths, subtractWeeks, subtractDays, subtractHours, subtractMinutes, subtractSeconds, subtractMilliseconds, subtractMicroseconds, subtractNanoseconds
 
 These functions subtract units of the interval specified by the function name from a date, a date with time or a string-encoded date / date with time. A date or date with time is returned.
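For symmetry with the new `addYears` examples above, here is a minimal sketch of the subtraction counterpart (illustrative only, not part of this patch; the output follows from the documented semantics):

```sql
WITH
    toDate('2024-01-01') AS date,
    toDateTime('2024-01-01 00:00:00') AS date_time
SELECT
    subtractYears(date, 1) AS subtract_years_with_date,
    subtractYears(date_time, 1) AS subtract_years_with_date_time
```

```response
┌─subtract_years_with_date─┬─subtract_years_with_date_time─┐
│               2023-01-01 │           2023-01-01 00:00:00 │
└──────────────────────────┴───────────────────────────────┘
```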
diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt
index e7477ffc5e1..441df44dd3f 100644
--- a/utils/check-style/aspell-ignore/en/aspell-dict.txt
+++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt
@@ -1088,6 +1088,8 @@ addQuarters
 addSeconds
 addWeeks
 addYears
+addInterval
+addTupleOfIntervals
 addr
 addressToLine
 addressToLineWithInlines

From 4e6e234d24eb46d62c7e7f0e99a1ecccda5cc0f4 Mon Sep 17 00:00:00 2001
From: Antonio Andelic
Date: Fri, 3 May 2024 12:19:57 +0200
Subject: [PATCH 071/289] Safer parent part access

---
 src/Storages/MergeTree/MergeTreeReadPoolBase.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp b/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp
index 0cbb0a86b2f..3e10285d6b0 100644
--- a/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp
+++ b/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp
@@ -113,9 +113,9 @@ MergeTreeReadTaskPtr MergeTreeReadPoolBase::createTask(
         ? std::make_unique(*read_info->shared_size_predictor)
         : nullptr; /// make a copy

-    auto get_part_name = [](const auto & task_info) -> const String &
+    auto get_part_name = [](const auto & task_info) -> String
     {
-        return task_info.data_part->isProjectionPart() ? task_info.data_part->getParentPart()->name : task_info.data_part->name;
+        return task_info.data_part->isProjectionPart() ? task_info.data_part->getParentPartName() : task_info.data_part->name;
     };

     auto extras = getExtras();

From 314573b7a66a2379aecb0b8e680d24561f00e03e Mon Sep 17 00:00:00 2001
From: Antonio Andelic
Date: Fri, 3 May 2024 12:40:05 +0200
Subject: [PATCH 072/289] Add debug check

---
 .../MergeTree/MergeTreeReadPoolBase.cpp       | 23 ++++++++++++++++++-
 1 file changed, 22 insertions(+), 1 deletion(-)

diff --git a/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp b/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp
index 3e10285d6b0..c759a12e151 100644
--- a/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp
+++ b/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp
@@ -6,6 +6,11 @@
 namespace DB
 {

+namespace ErrorCodes
+{
+    extern const int LOGICAL_ERROR;
+}
+
 MergeTreeReadPoolBase::MergeTreeReadPoolBase(
     RangesInDataParts && parts_,
     VirtualFields shared_virtual_fields_,
@@ -115,7 +120,23 @@ MergeTreeReadTaskPtr MergeTreeReadPoolBase::createTask(
     auto get_part_name = [](const auto & task_info) -> String
     {
-        return task_info.data_part->isProjectionPart() ? task_info.data_part->getParentPartName() : task_info.data_part->name;
+        const auto & data_part = task_info.data_part;
+
+        if (data_part->isProjectionPart())
+        {
+            auto parent_part_name = data_part->getParentPartName();
+
+            auto parent_part = data_part->storage.getPartIfExists(
+                parent_part_name, {MergeTreeDataPartState::PreActive, MergeTreeDataPartState::Active, MergeTreeDataPartState::Outdated});
+
+            if (!parent_part)
+                throw Exception(ErrorCodes::LOGICAL_ERROR, "Did not find parent part {} for potentially broken projection part {}",
+                    parent_part_name, data_part->getDataPartStorage().getFullPath());
+
+            return parent_part_name;
+        }
+
+        return data_part->name;
     };

     auto extras = getExtras();

From 9e670fe67cd560638ffd731ba391333bb7b78ee8 Mon Sep 17 00:00:00 2001
From: alesapin
Date: Fri, 3 May 2024 18:38:09 +0200
Subject: [PATCH 073/289] Fix logical error during SELECT query after ALTER in
 rare case

---
 src/Storages/MergeTree/IMergeTreeReader.cpp   |   9 +-
 ...rop_column_zookeeper_on_steroids.reference |  11 ++
 ...r_add_drop_column_zookeeper_on_steroids.sh | 149 ++++++++++++++++++
 3 files changed, 168 insertions(+), 1 deletion(-)
 create mode 100644 tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.reference
 create mode 100755 tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.sh

diff --git a/src/Storages/MergeTree/IMergeTreeReader.cpp b/src/Storages/MergeTree/IMergeTreeReader.cpp
index cf6b64aac85..54da03d1756 100644
--- a/src/Storages/MergeTree/IMergeTreeReader.cpp
+++ b/src/Storages/MergeTree/IMergeTreeReader.cpp
@@ -152,7 +152,14 @@ void IMergeTreeReader::evaluateMissingDefaults(Block additional_columns, Columns
         if (res_columns[pos] == nullptr)
             continue;

-        additional_columns.insert({res_columns[pos], name_and_type->type, name_and_type->name});
+        /// We must take column type from part if it exists. Because at the end of defaults
+        /// calculations we will materialize ALL the columns, not only missing.
+        /// If column doesn't exist in part then it will be substituted with default expression
+        const auto * column_in_part = part_columns.tryGet(name_and_type->name);
+        if (column_in_part != nullptr)
+            additional_columns.insert({res_columns[pos], column_in_part->type, name_and_type->name});
+        else
+            additional_columns.insert({res_columns[pos], name_and_type->type, name_and_type->name});
     }

     auto dag = DB::evaluateMissingDefaults(

diff --git a/tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.reference b/tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.reference
new file mode 100644
index 00000000000..ed135e928a9
--- /dev/null
+++ b/tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.reference
@@ -0,0 +1,11 @@
+Starting alters
+Finishing alters
+Equal number of columns
+Replication did not hang: synced all replicas of concurrent_alter_add_drop_steroids_
+Consistency: 1
+0
+0
+0
+0
+0
+0

diff --git a/tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.sh b/tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.sh
new file mode 100755
--- /dev/null
+++ b/tests/queries/0_stateless/03144_parallel_alter_add_drop_column_zookeeper_on_steroids.sh
@@ -0,0 +1,149 @@
+#!/usr/bin/env bash
+# Tags: zookeeper, no-parallel, no-fasttest
+
+CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
+# shellcheck source=../shell_config.sh
"$CURDIR"/../shell_config.sh +# shellcheck source=./replication.lib +. "$CURDIR"/replication.lib + +REPLICAS=3 + +for i in $(seq $REPLICAS); do + $CLICKHOUSE_CLIENT --query "DROP TABLE IF EXISTS concurrent_alter_add_drop_steroids_$i" +done + + +for i in $(seq $REPLICAS); do + $CLICKHOUSE_CLIENT --query "CREATE TABLE concurrent_alter_add_drop_steroids_$i (key UInt64, value0 UInt8) ENGINE = ReplicatedMergeTree('/clickhouse/tables/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/concurrent_alter_add_drop_steroids_column', '$i') ORDER BY key SETTINGS max_replicated_mutations_in_queue = 1000, number_of_free_entries_in_pool_to_execute_mutation = 0, max_replicated_merges_in_queue = 1000, index_granularity = 8192, index_granularity_bytes = '10Mi'" +done + +$CLICKHOUSE_CLIENT --query "INSERT INTO concurrent_alter_add_drop_steroids_1 SELECT number, number + 10 from numbers(100000)" + +for i in $(seq $REPLICAS); do + $CLICKHOUSE_CLIENT --query "SYSTEM SYNC REPLICA concurrent_alter_add_drop_steroids_$i" +done + + +function alter_thread() +{ + while true; do + REPLICA=$(($RANDOM % 3 + 1)) + ADD=$(($RANDOM % 5 + 1)) + $CLICKHOUSE_CLIENT --query "ALTER TABLE concurrent_alter_add_drop_steroids_$REPLICA ADD COLUMN value$ADD UInt32 DEFAULT 42 SETTINGS replication_alter_partitions_sync=0"; # additionaly we don't wait anything for more heavy concurrency + DROP=$(($RANDOM % 5 + 1)) + $CLICKHOUSE_CLIENT --query "ALTER TABLE concurrent_alter_add_drop_steroids_$REPLICA DROP COLUMN value$DROP SETTINGS replication_alter_partitions_sync=0"; # additionaly we don't wait anything for more heavy concurrency + sleep 0.$RANDOM + done +} + +function alter_thread_1() +{ + while true; do + REPLICA=$(($RANDOM % 3 + 1)) + ${CLICKHOUSE_CLIENT} --query "ALTER TABLE concurrent_alter_add_drop_steroids_1 MODIFY COLUMN value0 String SETTINGS mutations_sync = 0" + sleep 1.$RANDOM + ${CLICKHOUSE_CLIENT} --query "ALTER TABLE concurrent_alter_add_drop_steroids_1 MODIFY COLUMN value0 UInt8 SETTINGS mutations_sync = 0" + sleep 1.$RANDOM + done + +} + +function optimize_thread() +{ + while true; do + REPLICA=$(($RANDOM % 3 + 1)) + $CLICKHOUSE_CLIENT --query "OPTIMIZE TABLE concurrent_alter_add_drop_steroids_$REPLICA FINAL SETTINGS replication_alter_partitions_sync=0"; + sleep 0.$RANDOM + done +} + +function insert_thread() +{ + while true; do + REPLICA=$(($RANDOM % 3 + 1)) + $CLICKHOUSE_CLIENT --query "INSERT INTO concurrent_alter_add_drop_steroids_$REPLICA VALUES($RANDOM, 7)" + sleep 0.$RANDOM + done +} + +function select_thread() +{ + while true; do + REPLICA=$(($RANDOM % 3 + 1)) + $CLICKHOUSE_CLIENT --query "SELECT * FROM merge(currentDatabase(), 'concurrent_alter_add_drop_steroids_') FORMAT Null" + sleep 0.$RANDOM + done +} + + +echo "Starting alters" +export -f alter_thread; +export -f alter_thread_1; +export -f select_thread; +export -f optimize_thread; +export -f insert_thread; + + +TIMEOUT=30 + +# Sometimes we detach and attach tables +timeout $TIMEOUT bash -c alter_thread 2> /dev/null & +timeout $TIMEOUT bash -c alter_thread 2> /dev/null & +timeout $TIMEOUT bash -c alter_thread 2> /dev/null & + +timeout $TIMEOUT bash -c alter_thread_1 2> /dev/null & +timeout $TIMEOUT bash -c alter_thread_1 2> /dev/null & +timeout $TIMEOUT bash -c alter_thread_1 2> /dev/null & + +timeout $TIMEOUT bash -c select_thread 2> /dev/null & +timeout $TIMEOUT bash -c select_thread 2> /dev/null & +timeout $TIMEOUT bash -c select_thread 2> /dev/null & + +timeout $TIMEOUT bash -c optimize_thread 2> /dev/null & +timeout $TIMEOUT bash -c optimize_thread 2> /dev/null & +timeout 
$TIMEOUT bash -c optimize_thread 2> /dev/null & + +timeout $TIMEOUT bash -c insert_thread 2> /dev/null & +timeout $TIMEOUT bash -c insert_thread 2> /dev/null & +timeout $TIMEOUT bash -c insert_thread 2> /dev/null & +timeout $TIMEOUT bash -c insert_thread 2> /dev/null & +timeout $TIMEOUT bash -c insert_thread 2> /dev/null & + +wait + +echo "Finishing alters" + +columns1=$($CLICKHOUSE_CLIENT --query "select count() from system.columns where table='concurrent_alter_add_drop_steroids_1' and database='$CLICKHOUSE_DATABASE'" 2> /dev/null) +columns2=$($CLICKHOUSE_CLIENT --query "select count() from system.columns where table='concurrent_alter_add_drop_steroids_2' and database='$CLICKHOUSE_DATABASE'" 2> /dev/null) +columns3=$($CLICKHOUSE_CLIENT --query "select count() from system.columns where table='concurrent_alter_add_drop_steroids_3' and database='$CLICKHOUSE_DATABASE'" 2> /dev/null) + +while [ "$columns1" != "$columns2" ] || [ "$columns2" != "$columns3" ]; do + columns1=$($CLICKHOUSE_CLIENT --query "select count() from system.columns where table='concurrent_alter_add_drop_steroids_1' and database='$CLICKHOUSE_DATABASE'" 2> /dev/null) + columns2=$($CLICKHOUSE_CLIENT --query "select count() from system.columns where table='concurrent_alter_add_drop_steroids_2' and database='$CLICKHOUSE_DATABASE'" 2> /dev/null) + columns3=$($CLICKHOUSE_CLIENT --query "select count() from system.columns where table='concurrent_alter_add_drop_steroids_3' and database='$CLICKHOUSE_DATABASE'" 2> /dev/null) + + sleep 1 +done + +echo "Equal number of columns" + +# This alter will finish all previous, but replica 1 maybe still not up-to-date +while [[ $(timeout 120 ${CLICKHOUSE_CLIENT} --query "ALTER TABLE concurrent_alter_add_drop_steroids_1 MODIFY COLUMN value0 String SETTINGS replication_alter_partitions_sync=2" 2>&1) ]]; do + sleep 1 +done + +check_replication_consistency "concurrent_alter_add_drop_steroids_" "count(), sum(key), sum(cityHash64(value0))" + +for i in $(seq $REPLICAS); do + $CLICKHOUSE_CLIENT --query "SYSTEM SYNC REPLICA concurrent_alter_add_drop_steroids_$i" + $CLICKHOUSE_CLIENT --query "SELECT COUNT() FROM system.mutations WHERE is_done = 0 and table = 'concurrent_alter_add_drop_steroids_$i'" + $CLICKHOUSE_CLIENT --query "SELECT * FROM system.mutations WHERE is_done = 0 and table = 'concurrent_alter_add_drop_steroids_$i'" + $CLICKHOUSE_CLIENT --query "SELECT COUNT() FROM system.replication_queue WHERE table = 'concurrent_alter_add_drop_steroids_$i'" + $CLICKHOUSE_CLIENT --query "SELECT * FROM system.replication_queue WHERE table = 'concurrent_alter_add_drop_steroids_$i' and (type = 'ALTER_METADATA' or type = 'MUTATE_PART')" + + $CLICKHOUSE_CLIENT --query "DETACH TABLE concurrent_alter_add_drop_steroids_$i" + $CLICKHOUSE_CLIENT --query "ATTACH TABLE concurrent_alter_add_drop_steroids_$i" + + $CLICKHOUSE_CLIENT --query "DROP TABLE IF EXISTS concurrent_alter_add_drop_steroids_$i" +done From ec15298b824d6e51a7549ec79260a0c349174d98 Mon Sep 17 00:00:00 2001 From: Maxim Alexeev Date: Sun, 28 Apr 2024 14:20:59 +0300 Subject: [PATCH 074/289] First working prototype --- src/Core/Settings.h | 1 + src/Interpreters/GraceHashJoin.cpp | 1 + src/Interpreters/HashJoin.cpp | 37 +++++++++-- src/Interpreters/HashJoin.h | 14 ++++ src/Interpreters/JoinedTables.cpp | 2 +- src/Interpreters/TableJoin.cpp | 4 +- src/Interpreters/TableJoin.h | 10 ++- src/Interpreters/TemporaryDataOnDisk.cpp | 85 ++++++++++++++++-------- src/Interpreters/TemporaryDataOnDisk.h | 27 +++++++- src/Planner/PlannerJoinTree.cpp | 2 +- 10 files 
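The essence of the race this stress test hammers on can be sketched in a few statements (a hypothetical minimal repro distilled from the test; table and column names follow the test script):

```sql
-- A replica keeps parts whose physical column type lags behind the
-- declared type while the mutation is still in flight:
ALTER TABLE concurrent_alter_add_drop_steroids_1
    MODIFY COLUMN value0 String SETTINGS mutations_sync = 0;

-- A concurrent read over such parts has to evaluate missing defaults;
-- before this fix it used the declared type (String) even for a column
-- physically stored as UInt8, which could trip a logical error:
SELECT * FROM merge(currentDatabase(), 'concurrent_alter_add_drop_steroids_') FORMAT Null;
```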

From ec15298b824d6e51a7549ec79260a0c349174d98 Mon Sep 17 00:00:00 2001
From: Maxim Alexeev
Date: Sun, 28 Apr 2024 14:20:59 +0300
Subject: [PATCH 074/289] First working prototype

---
 src/Core/Settings.h                      |  1 +
 src/Interpreters/GraceHashJoin.cpp       |  1 +
 src/Interpreters/HashJoin.cpp            | 37 +++++++++--
 src/Interpreters/HashJoin.h              | 14 ++++
 src/Interpreters/JoinedTables.cpp        |  2 +-
 src/Interpreters/TableJoin.cpp           |  4 +-
 src/Interpreters/TableJoin.h             | 10 ++-
 src/Interpreters/TemporaryDataOnDisk.cpp | 85 ++++++++++++++--------
 src/Interpreters/TemporaryDataOnDisk.h   | 27 +++++++-
 src/Planner/PlannerJoinTree.cpp          |  2 +-
 10 files changed, 147 insertions(+), 36 deletions(-)

diff --git a/src/Core/Settings.h b/src/Core/Settings.h
index 7ed175d38f4..5dc80912ebb 100644
--- a/src/Core/Settings.h
+++ b/src/Core/Settings.h
@@ -463,6 +463,7 @@ class IColumn;
     M(UInt64, partial_merge_join_rows_in_right_blocks, 65536, "Split right-hand joining data in blocks of specified size. It's a portion of data indexed by min-max values and possibly unloaded on disk.", 0) \
     M(UInt64, join_on_disk_max_files_to_merge, 64, "For MergeJoin on disk set how much files it's allowed to sort simultaneously. Then this value bigger then more memory used and then less disk I/O needed. Minimum is 2.", 0) \
     M(UInt64, max_rows_in_set_to_optimize_join, 0, "Maximal size of the set to filter joined tables by each other row sets before joining. 0 - disable.", 0) \
+    M(UInt64, cross_join_max_bytes_inmemory, 1000000, "Maximal bytes to complete cross join in memory.", 0) \
     \
     M(Bool, compatibility_ignore_collation_in_create_table, true, "Compatibility ignore collation in create table", 0) \
     \

diff --git a/src/Interpreters/GraceHashJoin.cpp b/src/Interpreters/GraceHashJoin.cpp
index 53d1f48c291..ba51953e979 100644
--- a/src/Interpreters/GraceHashJoin.cpp
+++ b/src/Interpreters/GraceHashJoin.cpp
@@ -657,6 +657,7 @@ IBlocksStreamPtr GraceHashJoin::getDelayedBlocks()

 GraceHashJoin::InMemoryJoinPtr GraceHashJoin::makeInMemoryJoin(const String & bucket_id, size_t reserve_num)
 {
+    LOG_INFO(log, "GraceHashJoin\n");
     return std::make_unique<HashJoin>(table_join, right_sample_block, any_take_last_row, reserve_num, bucket_id);
 }

diff --git a/src/Interpreters/HashJoin.cpp b/src/Interpreters/HashJoin.cpp
index 9b05edbce36..e194df4e660 100644
--- a/src/Interpreters/HashJoin.cpp
+++ b/src/Interpreters/HashJoin.cpp
@@ -35,6 +35,7 @@
 #include
 #include
 #include
+#include "Core/Joins.h"
 #include
 #include

@@ -249,11 +250,13 @@ HashJoin::HashJoin(std::shared_ptr<TableJoin> table_join_, const Block & right_s
     , instance_id(instance_id_)
     , asof_inequality(table_join->getAsofInequality())
     , data(std::make_shared<RightTableData>())
+    , tmp_data(std::make_unique<TemporaryDataOnDisk>(table_join_->getTempDataOnDisk()))
     , right_sample_block(right_sample_block_)
     , max_joined_block_rows(table_join->maxJoinedBlockRows())
     , instance_log_id(!instance_id_.empty() ? "(" + instance_id_ + ") " : "")
     , log(getLogger("HashJoin"))
 {
+    LOG_INFO(log, "KEK CONSTRUCTOR {}\n", reserve_num);
     LOG_TRACE(log, "{}Keys: {}, datatype: {}, kind: {}, strictness: {}, right header: {}",
         instance_log_id, TableJoin::formatClauses(table_join->getClauses(), true), data->type, kind, strictness, right_sample_block.dumpStructure());

@@ -827,6 +830,16 @@ bool HashJoin::addBlockToJoin(const Block & source_block_, bool check_limits)
     if (shrink_blocks)
         block_to_save = block_to_save.shrinkToFit();

+
+    if (kind == JoinKind::Cross)
+    {
+        if (tmp_stream == nullptr)
+        {
+            tmp_stream = &tmp_data->createStream(right_sample_block);
+        }
+        tmp_stream->write(block_to_save);
+    }
+
     size_t total_rows = 0;
     size_t total_bytes = 0;
     {
@@ -928,6 +941,7 @@ bool HashJoin::addBlockToJoin(const Block & source_block_, bool check_limits)

         if (!flag_per_row && !is_inserted)
         {
+            LOG_INFO(log, "LOL\n\n\n\n\n\n");
             LOG_TRACE(log, "Skipping inserting block with {} rows", rows);
             data->blocks_allocated_size -= stored_block->allocatedBytes();
             data->blocks.pop_back();
@@ -944,7 +958,6 @@ bool HashJoin::addBlockToJoin(const Block & source_block_, bool check_limits)

     shrinkStoredBlocksToFit(total_bytes);

-
     return table_join->sizeLimits().check(total_rows, total_bytes, "JOIN", ErrorCodes::SET_SIZE_LIMIT_EXCEEDED);
 }

@@ -2275,13 +2288,13 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed)
     for (size_t left_row = start_left_row; left_row < rows_left; ++left_row)
     {
         size_t block_number = 0;
-        for (const Block & compressed_block_right : data->blocks)
+
+        auto process_right_block = [&](const Block & block_right)
         {
             ++block_number;
             if (block_number < start_right_block)
-                continue;
+                return;

-            auto block_right = compressed_block_right.decompress();
             size_t rows_right = block_right.rows();
             rows_added += rows_right;

@@ -2294,6 +2307,22 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed)
                 const IColumn & column_right = *block_right.getByPosition(col_num).column;
                 dst_columns[num_existing_columns + col_num]->insertRangeFrom(column_right, 0, rows_right);
             }
+        };
+
+        if (tmp_stream)
+        {
+            tmp_stream->finishWritingAsyncSafe();
+            auto reader = tmp_stream->getReadStream();
+            while (auto block_right = reader->read())
+            {
+                process_right_block(block_right);
+            }
+        }
+
+        for (const Block & compressed_block_right : data->blocks)
+        {
+            auto block_right = compressed_block_right.decompress();
+            process_right_block(block_right);
         }

         start_right_block = 0;

diff --git a/src/Interpreters/HashJoin.h b/src/Interpreters/HashJoin.h
index b7f41a7eb6b..1eb4d0f8030 100644
--- a/src/Interpreters/HashJoin.h
+++ b/src/Interpreters/HashJoin.h
@@ -26,6 +26,7 @@
 #include

 #include
+#include

 namespace DB
 {
@@ -414,6 +415,15 @@ public:

     void setMaxJoinedBlockRows(size_t value) { max_joined_block_rows = value; }

+    TemporaryFileStream* getStreamForCrossJoin()
+    {
+        auto streams = tmp_data->getStreams();
+        assert(streams.size() <= 1);
+        if (streams.empty())
+            return nullptr;
+        return streams[0];
+    }
+
 private:
     friend class NotJoinedHash;

@@ -442,6 +452,10 @@ private:
     RightTableDataPtr data;
     std::vector<Sizes> key_sizes;

+    /// Needed to do external cross join
+    TemporaryDataOnDiskPtr tmp_data;
+    TemporaryFileStream* tmp_stream{nullptr};
+
     /// Block with columns from the right-side table.
     Block right_sample_block;
     /// Block with columns from the right-side table except key columns.
diff --git a/src/Interpreters/JoinedTables.cpp b/src/Interpreters/JoinedTables.cpp
index 5b549a19083..457ed3ef4a6 100644
--- a/src/Interpreters/JoinedTables.cpp
+++ b/src/Interpreters/JoinedTables.cpp
@@ -310,7 +310,7 @@ std::shared_ptr<TableJoin> JoinedTables::makeTableJoin(const ASTSelectQuery & se
     auto settings = context->getSettingsRef();
     MultiEnum<JoinAlgorithm> join_algorithm = settings.join_algorithm;
     bool try_use_direct_join = join_algorithm.isSet(JoinAlgorithm::DIRECT) || join_algorithm.isSet(JoinAlgorithm::DEFAULT);
-    auto table_join = std::make_shared<TableJoin>(settings, context->getGlobalTemporaryVolume());
+    auto table_join = std::make_shared<TableJoin>(settings, context->getGlobalTemporaryVolume(), context->getTempDataOnDisk());

     const ASTTablesInSelectQueryElement * ast_join = select_query_.join();
     const auto & table_to_join = ast_join->table_expression->as();

diff --git a/src/Interpreters/TableJoin.cpp b/src/Interpreters/TableJoin.cpp
index 48d59dd3b24..7ceb90704f3 100644
--- a/src/Interpreters/TableJoin.cpp
+++ b/src/Interpreters/TableJoin.cpp
@@ -103,7 +103,7 @@ bool forAllKeys(OnExpr & expressions, Func callback)
 }

-TableJoin::TableJoin(const Settings & settings, VolumePtr tmp_volume_)
+TableJoin::TableJoin(const Settings & settings, VolumePtr tmp_volume_, TemporaryDataOnDiskScopePtr tmp_data_)
     : size_limits(SizeLimits{settings.max_rows_in_join, settings.max_bytes_in_join, settings.join_overflow_mode})
     , default_max_bytes(settings.default_max_bytes_in_join)
     , join_use_nulls(settings.join_use_nulls)
@@ -111,12 +111,14 @@ TableJoin::TableJoin(const Settings & settings, VolumePtr tmp_volume_)
     , cross_join_min_bytes_to_compress(settings.cross_join_min_bytes_to_compress)
     , max_joined_block_rows(settings.max_joined_block_size_rows)
     , join_algorithm(settings.join_algorithm)
+    , cross_join_max_bytes_inmemory(settings.cross_join_max_bytes_inmemory)
     , partial_merge_join_rows_in_right_blocks(settings.partial_merge_join_rows_in_right_blocks)
     , partial_merge_join_left_table_buffer_bytes(settings.partial_merge_join_left_table_buffer_bytes)
     , max_files_to_merge(settings.join_on_disk_max_files_to_merge)
     , temporary_files_codec(settings.temporary_files_codec)
     , max_memory_usage(settings.max_memory_usage)
     , tmp_volume(tmp_volume_)
+    , tmp_data(tmp_data_)
 {
 }

diff --git a/src/Interpreters/TableJoin.h b/src/Interpreters/TableJoin.h
index 88905edd3e8..d6920d6afbf 100644
--- a/src/Interpreters/TableJoin.h
+++ b/src/Interpreters/TableJoin.h
@@ -9,6 +9,7 @@
 #include
 #include
 #include
+#include

 #include
 #include
@@ -144,6 +145,7 @@ private:
     const UInt64 cross_join_min_bytes_to_compress = 10000;
     const size_t max_joined_block_rows = 0;
     std::vector join_algorithm;
+    const UInt64 cross_join_max_bytes_inmemory = 1000000;
     const size_t partial_merge_join_rows_in_right_blocks = 0;
     const size_t partial_merge_join_left_table_buffer_bytes = 0;
     const size_t max_files_to_merge = 0;
@@ -188,6 +190,8 @@ private:

     VolumePtr tmp_volume;

+    TemporaryDataOnDiskScopePtr tmp_data;
+
     std::shared_ptr right_storage_join;

     std::shared_ptr right_kv_storage;
@@ -233,7 +237,7 @@ private:

 public:
     TableJoin() = default;

-    TableJoin(const Settings & settings, VolumePtr tmp_volume_);
+    TableJoin(const Settings & settings, VolumePtr tmp_volume_, TemporaryDataOnDiskScopePtr tmp_data_);

     /// for StorageJoin
     TableJoin(SizeLimits limits, bool use_nulls, JoinKind kind, JoinStrictness strictness,
@@ -259,6 +263,8 @@ public:

     VolumePtr getGlobalTemporaryVolume() { return tmp_volume; }

+    TemporaryDataOnDiskScopePtr getTempDataOnDisk() { return tmp_data; }
+
     ActionsDAGPtr createJoinedBlockActions(ContextPtr context) const;

     const std::vector & getEnabledJoinAlgorithms() const { return join_algorithm; }
@@ -275,6 +281,8 @@ public:

     bool allowParallelHashJoin() const;

+    UInt64 crossJoinMaxBytesInmemory() const { return cross_join_max_bytes_inmemory; }
+
     bool joinUseNulls() const { return join_use_nulls; }

     UInt64 crossJoinMinRowsToCompress() const { return cross_join_min_rows_to_compress; }

diff --git a/src/Interpreters/TemporaryDataOnDisk.cpp b/src/Interpreters/TemporaryDataOnDisk.cpp
index 9a237738b3e..e50d501f6d3 100644
--- a/src/Interpreters/TemporaryDataOnDisk.cpp
+++ b/src/Interpreters/TemporaryDataOnDisk.cpp
@@ -1,12 +1,11 @@
+#include
+#include
 #include
 #include
-#include
 #include
-#include
 #include
 #include
-#include
 #include
 #include
 #include
@@ -14,6 +13,7 @@
 #include
 #include
+#include "Common/Exception.h"

 namespace ProfileEvents
 {
@@ -224,33 +224,26 @@ struct TemporaryFileStream::OutputWriter
     bool finalized = false;
 };

-struct TemporaryFileStream::InputReader
+InputReader::InputReader(const String & path, const Block & header_, size_t size)
+    : in_file_buf(path, size ? std::min(DBMS_DEFAULT_BUFFER_SIZE, size) : DBMS_DEFAULT_BUFFER_SIZE)
+    , in_compressed_buf(in_file_buf)
+    , in_reader(in_compressed_buf, header_, DBMS_TCP_PROTOCOL_VERSION)
 {
-    InputReader(const String & path, const Block & header_, size_t size = 0)
-        : in_file_buf(path, size ? std::min(DBMS_DEFAULT_BUFFER_SIZE, size) : DBMS_DEFAULT_BUFFER_SIZE)
-        , in_compressed_buf(in_file_buf)
-        , in_reader(in_compressed_buf, header_, DBMS_TCP_PROTOCOL_VERSION)
-    {
-        LOG_TEST(getLogger("TemporaryFileStream"), "Reading {} from {}", header_.dumpStructure(), path);
-    }
+    LOG_TEST(getLogger("TemporaryFileStream"), "Reading {} from {}", header_.dumpStructure(), path);
+}

-    explicit InputReader(const String & path, size_t size = 0)
-        : in_file_buf(path, size ? std::min(DBMS_DEFAULT_BUFFER_SIZE, size) : DBMS_DEFAULT_BUFFER_SIZE)
-        , in_compressed_buf(in_file_buf)
-        , in_reader(in_compressed_buf, DBMS_TCP_PROTOCOL_VERSION)
-    {
-        LOG_TEST(getLogger("TemporaryFileStream"), "Reading from {}", path);
-    }
+InputReader::InputReader(const String & path, size_t size)
+    : in_file_buf(path, size ? std::min(DBMS_DEFAULT_BUFFER_SIZE, size) : DBMS_DEFAULT_BUFFER_SIZE)
+    , in_compressed_buf(in_file_buf)
+    , in_reader(in_compressed_buf, DBMS_TCP_PROTOCOL_VERSION)
+{
+    LOG_TEST(getLogger("TemporaryFileStream"), "Reading from {}", path);
+}

-    Block read()
-    {
-        return in_reader.read();
-    }
-
-    ReadBufferFromFile in_file_buf;
-    CompressedReadBuffer in_compressed_buf;
-    NativeReader in_reader;
-};
+Block InputReader::read()
+{
+    return in_reader.read();
+}

 TemporaryFileStream::TemporaryFileStream(TemporaryFileOnDiskHolder file_, const Block & header_, TemporaryDataOnDisk * parent_)
     : parent(parent_)
@@ -310,6 +303,20 @@ TemporaryFileStream::Stat TemporaryFileStream::finishWriting()
     return stat;
 }

+TemporaryFileStream::Stat TemporaryFileStream::finishWritingAsyncSafe()
+{
+    if (!writing_finished.load(std::memory_order_relaxed))
+    {
+        std::lock_guard lock(finish_writing);
+        if (!writing_finished.load())
+        {
+            return finishWriting();
+        }
+        writing_finished.store(true);
+    }
+    return stat;
+}
+
 bool TemporaryFileStream::isWriteFinished() const
 {
     assert(in_reader == nullptr || out_writer == nullptr);
@@ -324,6 +331,12 @@ Block TemporaryFileStream::read()
     if (isEof())
         return {};

+    if (auto type = read_type.exchange(1); type == 2)
+    {
+        read_type.store(2);
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Different type of reading was requested earlier");
+    }
+
     if (!in_reader)
     {
         in_reader = std::make_unique<InputReader>(getPath(), header, getSize());
@@ -334,10 +347,28 @@ Block TemporaryFileStream::read()
     {
         /// finalize earlier to release resources, do not wait for the destructor
         this->release();
+        in_reader.reset();
     }
     return block;
 }

+std::unique_ptr<InputReader> TemporaryFileStream::getReadStream()
+{
+    if (!isWriteFinished())
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Writing has been not finished");
+
+    if (isEof())
+        return nullptr;
+
+    if (auto type = read_type.exchange(2); type == 1)
+    {
+        read_type.store(1);
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Different type of reading was requested earlier");
+    }
+
+    return std::make_unique<InputReader>(getPath(), header, getSize());
+}
+
 void TemporaryFileStream::updateAllocAndCheck()
 {
     assert(out_writer);

diff --git a/src/Interpreters/TemporaryDataOnDisk.h b/src/Interpreters/TemporaryDataOnDisk.h
index 40100a62b44..792988e94bd 100644
--- a/src/Interpreters/TemporaryDataOnDisk.h
+++ b/src/Interpreters/TemporaryDataOnDisk.h
@@ -1,7 +1,11 @@
 #pragma once

+#include
 #include
+#include
+#include
+#include
 #include
 #include
 #include
@@ -130,6 +134,19 @@ private:
     typename CurrentMetrics::Metric current_metric_scope = CurrentMetrics::TemporaryFilesUnknown;
 };

+struct InputReader
+{
+    InputReader(const String & path, const Block & header_, size_t size = 0);
+
+    explicit InputReader(const String & path, size_t size = 0);
+
+    Block read();
+
+    ReadBufferFromFile in_file_buf;
+    CompressedReadBuffer in_compressed_buf;
+    NativeReader in_reader;
+};
+
 /*
  * Data can be written into this stream and then read.
  * After finish writing, call `finishWriting` and then `read` to read the data.
@@ -154,8 +171,11 @@ public:
     void flush();

     Stat finishWriting();
+    Stat finishWritingAsyncSafe();
     bool isWriteFinished() const;

+    std::unique_ptr<InputReader> getReadStream();
+
     Block read();

     String getPath() const;
@@ -184,10 +204,15 @@ private:

     Stat stat;

+    /// 0 - means that we haven't requested any read, 1 - read from function TemporaryFileStream::read, 2 - read via getReadStream
+    std::atomic_char read_type{0};
+
+    mutable std::mutex finish_writing;
+    std::atomic_bool writing_finished{false};
+
     struct OutputWriter;
     std::unique_ptr<OutputWriter> out_writer;

-    struct InputReader;
     std::unique_ptr<InputReader> in_reader;
 };

diff --git a/src/Planner/PlannerJoinTree.cpp b/src/Planner/PlannerJoinTree.cpp
index 514c19b0f89..3467299812a 100644
--- a/src/Planner/PlannerJoinTree.cpp
+++ b/src/Planner/PlannerJoinTree.cpp
@@ -1196,7 +1196,7 @@ JoinTreeQueryPlan buildQueryPlanForJoinNode(const QueryTreeNodePtr & join_table_
         }
     }

-    auto table_join = std::make_shared<TableJoin>(settings, query_context->getGlobalTemporaryVolume());
+    auto table_join = std::make_shared<TableJoin>(settings, query_context->getGlobalTemporaryVolume(), query_context->getTempDataOnDisk());
     table_join->getTableJoin() = join_node.toASTTableJoin()->as();

     if (join_constant)
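A small sketch of where the new setting surfaces (hypothetical session; in this first prototype the setting is added and plumbed through `TableJoin`, but the diff shown here does not yet consult it to gate the spill):

```sql
-- Intended in-memory budget for the right side of a CROSS JOIN before
-- the temporary-file stream takes over (default value from this patch):
SET cross_join_max_bytes_inmemory = 1000000;

SELECT count()
FROM numbers(1000) AS l
CROSS JOIN numbers(1000) AS r;
```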
"TabSeparatedRaw" : "TabSeparated", register_func); registerWithNamesAndTypes(is_raw ? "TSVRaw" : "TSV", register_func); + if (is_raw) + registerWithNamesAndTypes("Raw", register_func); } } @@ -433,6 +435,8 @@ void registerTSVSchemaReader(FormatFactory & factory) registerWithNamesAndTypes(is_raw ? "TabSeparatedRaw" : "TabSeparated", register_func); registerWithNamesAndTypes(is_raw ? "TSVRaw" : "TSV", register_func); + if (is_raw) + registerWithNamesAndTypes("Raw", register_func); } } @@ -506,8 +510,12 @@ void registerFileSegmentationEngineTabSeparated(FormatFactory & factory) registerWithNamesAndTypes(is_raw ? "TSVRaw" : "TSV", register_func); registerWithNamesAndTypes(is_raw ? "TabSeparatedRaw" : "TabSeparated", register_func); + if (is_raw) + registerWithNamesAndTypes("Raw", register_func); markFormatWithNamesAndTypesSupportsSamplingColumns(is_raw ? "TSVRaw" : "TSV", factory); markFormatWithNamesAndTypesSupportsSamplingColumns(is_raw ? "TabSeparatedRaw" : "TabSeparated", factory); + if (is_raw) + markFormatWithNamesAndTypesSupportsSamplingColumns("Raw", factory); } // We can use the same segmentation engine for TSKV. diff --git a/src/Processors/Formats/Impl/TabSeparatedRowOutputFormat.cpp b/src/Processors/Formats/Impl/TabSeparatedRowOutputFormat.cpp index a4a5aea26cb..c8384c09be6 100644 --- a/src/Processors/Formats/Impl/TabSeparatedRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/TabSeparatedRowOutputFormat.cpp @@ -95,7 +95,10 @@ void registerOutputFormatTabSeparated(FormatFactory & factory) registerWithNamesAndTypes(is_raw ? "TSVRaw" : "TSV", register_func); registerWithNamesAndTypes(is_raw ? "TabSeparatedRaw" : "TabSeparated", register_func); if (is_raw) + { registerWithNamesAndTypes("LineAsString", register_func); + registerWithNamesAndTypes("Raw", register_func); + } } } diff --git a/tests/queries/0_stateless/00397_tsv_format_synonym.reference b/tests/queries/0_stateless/00397_tsv_format_synonym.reference index c4a86983be3..c91169a06fa 100644 --- a/tests/queries/0_stateless/00397_tsv_format_synonym.reference +++ b/tests/queries/0_stateless/00397_tsv_format_synonym.reference @@ -28,3 +28,6 @@ UInt8 String String 1 hello world 2 hello world 3 hello world +1 hello world +2 hello world +3 hello world diff --git a/tests/queries/0_stateless/00397_tsv_format_synonym.sql b/tests/queries/0_stateless/00397_tsv_format_synonym.sql index 8c69a795857..51283c6ced9 100644 --- a/tests/queries/0_stateless/00397_tsv_format_synonym.sql +++ b/tests/queries/0_stateless/00397_tsv_format_synonym.sql @@ -9,3 +9,4 @@ SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TSVWithN SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TabSeparatedRaw; SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TSVRaw; +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT Raw; From ab7d457c51d92123d1845486a2f3243324f06503 Mon Sep 17 00:00:00 2001 From: Yohann Jardin Date: Mon, 6 May 2024 11:35:48 +0200 Subject: [PATCH 076/289] Update ErrorCodes for functions using NUMBER_OF_ARGUMENTS_DOESNT_MATCH --- src/AggregateFunctions/AggregateFunctionAggThrow.cpp | 4 ++-- .../AggregateFunctionGroupArrayInsertAt.cpp | 3 ++- src/AggregateFunctions/AggregateFunctionMLMethod.cpp | 7 ++++--- src/AggregateFunctions/AggregateFunctionMannWhitney.cpp | 4 ++-- src/AggregateFunctions/AggregateFunctionQuantile.cpp | 4 ++-- .../AggregateFunctionQuantileBFloat16Weighted.cpp | 4 ++-- src/AggregateFunctions/AggregateFunctionQuantileDD.cpp | 4 ++-- 
.../AggregateFunctionQuantileExactHigh.cpp | 4 ++-- .../AggregateFunctionQuantileExactInclusive.cpp | 4 ++-- .../AggregateFunctionQuantileTiming.cpp | 4 ++-- src/AggregateFunctions/AggregateFunctionTopK.cpp | 4 ++-- src/AggregateFunctions/AggregateFunctionWelchTTest.cpp | 4 ++-- .../Combinators/AggregateFunctionArray.cpp | 4 ++-- src/AggregateFunctions/Combinators/AggregateFunctionIf.h | 4 ++-- src/Functions/Kusto/KqlArraySort.cpp | 4 ++-- src/Functions/MultiSearchFirstPositionImpl.h | 4 ++-- src/Functions/MultiSearchImpl.h | 4 ++-- src/Functions/array/arrayEnumerateExtended.h | 4 ++-- src/Functions/array/arrayEnumerateRanked.h | 7 ++++--- src/Functions/array/arrayFold.cpp | 6 +++--- src/Functions/array/arrayReduce.cpp | 4 ++-- src/Functions/array/arrayZip.cpp | 4 ++-- src/Functions/concat.cpp | 6 +++--- src/Functions/generateULID.cpp | 4 ++-- src/Functions/jsonMergePatch.cpp | 4 ++-- src/Functions/nested.cpp | 9 +++++---- src/Functions/now64.cpp | 4 ++-- src/Functions/nowInBlock.cpp | 4 ++-- src/Functions/parseTimeDelta.cpp | 7 ++++--- src/Functions/pointInPolygon.cpp | 4 ++-- src/TableFunctions/TableFunctionValues.cpp | 4 ++-- 31 files changed, 73 insertions(+), 68 deletions(-) diff --git a/src/AggregateFunctions/AggregateFunctionAggThrow.cpp b/src/AggregateFunctions/AggregateFunctionAggThrow.cpp index 27432bc94ba..ebf6cabbcfd 100644 --- a/src/AggregateFunctions/AggregateFunctionAggThrow.cpp +++ b/src/AggregateFunctions/AggregateFunctionAggThrow.cpp @@ -16,7 +16,7 @@ struct Settings; namespace ErrorCodes { extern const int AGGREGATE_FUNCTION_THROW; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } namespace @@ -116,7 +116,7 @@ void registerAggregateFunctionAggThrow(AggregateFunctionFactory & factory) if (parameters.size() == 1) throw_probability = parameters[0].safeGet(); else if (parameters.size() > 1) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} cannot have more than one parameter", name); + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} cannot have more than one parameter", name); return std::make_shared(argument_types, parameters, throw_probability); }); diff --git a/src/AggregateFunctions/AggregateFunctionGroupArrayInsertAt.cpp b/src/AggregateFunctions/AggregateFunctionGroupArrayInsertAt.cpp index 60e8df64283..8674aac2e90 100644 --- a/src/AggregateFunctions/AggregateFunctionGroupArrayInsertAt.cpp +++ b/src/AggregateFunctions/AggregateFunctionGroupArrayInsertAt.cpp @@ -27,6 +27,7 @@ struct Settings; namespace ErrorCodes { extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; extern const int TOO_LARGE_ARRAY_SIZE; extern const int CANNOT_CONVERT_TYPE; extern const int ILLEGAL_TYPE_OF_ARGUMENT; @@ -74,7 +75,7 @@ public: if (!params.empty()) { if (params.size() > 2) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at most two parameters.", getName()); + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at most two parameters.", getName()); default_value = params[0]; diff --git a/src/AggregateFunctions/AggregateFunctionMLMethod.cpp b/src/AggregateFunctions/AggregateFunctionMLMethod.cpp index d2178437770..730b5cfa5cc 100644 --- a/src/AggregateFunctions/AggregateFunctionMLMethod.cpp +++ b/src/AggregateFunctions/AggregateFunctionMLMethod.cpp @@ -22,7 +22,8 @@ namespace ErrorCodes extern const int BAD_ARGUMENTS; extern 
const int LOGICAL_ERROR; extern const int ILLEGAL_TYPE_OF_ARGUMENT; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } namespace @@ -34,12 +35,12 @@ namespace const std::string & name, const DataTypes & argument_types, const Array & parameters, const Settings *) { if (parameters.size() > 4) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at most four parameters: " "learning_rate, l2_regularization_coef, mini-batch size and weights_updater method", name); if (argument_types.size() < 2) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least two arguments: target and model's parameters", name); for (size_t i = 0; i < argument_types.size(); ++i) diff --git a/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp b/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp index e7bc5df335f..d185058dbd0 100644 --- a/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp +++ b/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp @@ -21,7 +21,7 @@ namespace ErrorCodes { extern const int NOT_IMPLEMENTED; extern const int ILLEGAL_TYPE_OF_ARGUMENT; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; extern const int BAD_ARGUMENTS; } @@ -141,7 +141,7 @@ public: : IAggregateFunctionDataHelper ({arguments}, {}, createResultType()) { if (params.size() > 2) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} require two parameter or less", getName()); + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} require two parameter or less", getName()); if (params.empty()) { diff --git a/src/AggregateFunctions/AggregateFunctionQuantile.cpp b/src/AggregateFunctions/AggregateFunctionQuantile.cpp index 4d37ec69d26..f72b28030c3 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantile.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantile.cpp @@ -14,7 +14,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int NOT_IMPLEMENTED; } @@ -118,7 +118,7 @@ AggregateFunctionPtr createAggregateFunctionQuantile( const std::string & name, const DataTypes & argument_types, const Array & params, const Settings *) { if (argument_types.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at least one argument", name); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least one argument", name); const DataTypePtr & argument_type = argument_types[0]; WhichDataType which(argument_type); diff --git a/src/AggregateFunctions/AggregateFunctionQuantileBFloat16Weighted.cpp b/src/AggregateFunctions/AggregateFunctionQuantileBFloat16Weighted.cpp index 6d881b77c16..b0a39b1fdab 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantileBFloat16Weighted.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantileBFloat16Weighted.cpp @@ -12,7 +12,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -27,7 
+27,7 @@ AggregateFunctionPtr createAggregateFunctionQuantile( const std::string & name, const DataTypes & argument_types, const Array & params, const Settings *) { if (argument_types.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at least one argument", name); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least one argument", name); const DataTypePtr & argument_type = argument_types[0]; WhichDataType which(argument_type); diff --git a/src/AggregateFunctions/AggregateFunctionQuantileDD.cpp b/src/AggregateFunctions/AggregateFunctionQuantileDD.cpp index f3d6b26ee75..7b1ae43038a 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantileDD.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantileDD.cpp @@ -13,7 +13,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -29,7 +29,7 @@ AggregateFunctionPtr createAggregateFunctionQuantile( const std::string & name, const DataTypes & argument_types, const Array & params, const Settings *) { if (argument_types.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at least one argument", name); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least one argument", name); const DataTypePtr & argument_type = argument_types[0]; WhichDataType which(argument_type); diff --git a/src/AggregateFunctions/AggregateFunctionQuantileExactHigh.cpp b/src/AggregateFunctions/AggregateFunctionQuantileExactHigh.cpp index b44df755158..6fa4158076c 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantileExactHigh.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantileExactHigh.cpp @@ -13,7 +13,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -29,7 +29,7 @@ AggregateFunctionPtr createAggregateFunctionQuantile( const std::string & name, const DataTypes & argument_types, const Array & params, const Settings *) { if (argument_types.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at least one argument", name); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least one argument", name); const DataTypePtr & argument_type = argument_types[0]; WhichDataType which(argument_type); diff --git a/src/AggregateFunctions/AggregateFunctionQuantileExactInclusive.cpp b/src/AggregateFunctions/AggregateFunctionQuantileExactInclusive.cpp index d8287be86ca..bed5cf95bd8 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantileExactInclusive.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantileExactInclusive.cpp @@ -13,7 +13,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -28,7 +28,7 @@ AggregateFunctionPtr createAggregateFunctionQuantile( const std::string & name, const DataTypes & argument_types, const Array & params, const Settings *) { if (argument_types.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at least one argument", name); + throw 
Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least one argument", name); const DataTypePtr & argument_type = argument_types[0]; WhichDataType which(argument_type); diff --git a/src/AggregateFunctions/AggregateFunctionQuantileTiming.cpp b/src/AggregateFunctions/AggregateFunctionQuantileTiming.cpp index 1bb77892c0d..e293fc6e59d 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantileTiming.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantileTiming.cpp @@ -13,7 +13,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -28,7 +28,7 @@ AggregateFunctionPtr createAggregateFunctionQuantile( const std::string & name, const DataTypes & argument_types, const Array & params, const Settings *) { if (argument_types.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires at least one argument", name); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires at least one argument", name); const DataTypePtr & argument_type = argument_types[0]; WhichDataType which(argument_type); diff --git a/src/AggregateFunctions/AggregateFunctionTopK.cpp b/src/AggregateFunctions/AggregateFunctionTopK.cpp index d0e4f507d46..26f756abe18 100644 --- a/src/AggregateFunctions/AggregateFunctionTopK.cpp +++ b/src/AggregateFunctions/AggregateFunctionTopK.cpp @@ -35,7 +35,7 @@ namespace ErrorCodes extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int BAD_ARGUMENTS; extern const int LOGICAL_ERROR; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } @@ -467,7 +467,7 @@ AggregateFunctionPtr createAggregateFunctionTopK(const std::string & name, const if (!params.empty()) { if (params.size() > 3) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Aggregate function '{}' requires three parameters or less", name); threshold = applyVisitor(FieldVisitorConvertToNumber(), params[0]); diff --git a/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp b/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp index 849f81279e7..7f1c4861fbc 100644 --- a/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp +++ b/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp @@ -7,7 +7,7 @@ namespace ErrorCodes { extern const int BAD_ARGUMENTS; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } namespace DB @@ -80,7 +80,7 @@ AggregateFunctionPtr createAggregateFunctionWelchTTest( assertBinary(name, argument_types); if (parameters.size() > 1) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} requires zero or one parameter.", name); + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} requires zero or one parameter.", name); if (!isNumber(argument_types[0]) || !isNumber(argument_types[1])) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Aggregate function {} only supports numerical types", name); diff --git a/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp b/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp index a54092f0bcb..6b60faadf07 100644 --- a/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp +++ b/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp @@ -9,7 +9,7 @@ 
struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -26,7 +26,7 @@ public: DataTypes transformArguments(const DataTypes & arguments) const override { if (arguments.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "-Array aggregate functions require at least one argument"); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "-Array aggregate functions require at least one argument"); DataTypes nested_arguments; for (const auto & type : arguments) diff --git a/src/AggregateFunctions/Combinators/AggregateFunctionIf.h b/src/AggregateFunctions/Combinators/AggregateFunctionIf.h index a893fc91780..f57cfa41752 100644 --- a/src/AggregateFunctions/Combinators/AggregateFunctionIf.h +++ b/src/AggregateFunctions/Combinators/AggregateFunctionIf.h @@ -18,7 +18,7 @@ struct Settings; namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -42,7 +42,7 @@ public: , nested_func(nested), num_arguments(types.size()) { if (num_arguments == 0) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Aggregate function {} require at least one argument", getName()); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Aggregate function {} require at least one argument", getName()); only_null_condition = types.back()->onlyNull(); diff --git a/src/Functions/Kusto/KqlArraySort.cpp b/src/Functions/Kusto/KqlArraySort.cpp index 5be36328cc3..ac301c474e8 100644 --- a/src/Functions/Kusto/KqlArraySort.cpp +++ b/src/Functions/Kusto/KqlArraySort.cpp @@ -11,7 +11,7 @@ namespace DB { namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int ILLEGAL_COLUMN; } @@ -35,7 +35,7 @@ public: { if (arguments.empty()) throw Exception( - ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Function {} needs at least one argument; passed {}.", getName(), arguments.size()); diff --git a/src/Functions/MultiSearchFirstPositionImpl.h b/src/Functions/MultiSearchFirstPositionImpl.h index 99dd3f9d394..aca96cabf04 100644 --- a/src/Functions/MultiSearchFirstPositionImpl.h +++ b/src/Functions/MultiSearchFirstPositionImpl.h @@ -10,7 +10,7 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } template @@ -37,7 +37,7 @@ struct MultiSearchFirstPositionImpl { // For performance of Volnitsky search, it is crucial to save only one byte for pattern number. 
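The comment above carries the real constraint behind these two hunks: Volnitsky multi-search stores the index of the matched pattern in a single byte, so at most 255 needles can take part in one search pass, and exceeding that is reported as an argument-count error (now `TOO_MANY_ARGUMENTS_FOR_FUNCTION`). A minimal self-contained sketch of that guard, using illustrative names rather than the real ClickHouse API:

```cpp
#include <cstddef>
#include <cstdint>
#include <limits>
#include <stdexcept>
#include <string>
#include <vector>

// Sketch only: a Volnitsky-style multi-search keeps the pattern index in one
// byte, so no more than 255 needles may take part in a single search pass.
void checkNeedleCount(const std::vector<std::string> & needles)
{
    constexpr std::size_t max_needles = std::numeric_limits<std::uint8_t>::max();
    if (needles.size() > max_needles)
        throw std::invalid_argument(
            "too many needles: passed " + std::to_string(needles.size())
            + ", should be at most " + std::to_string(max_needles));
}
```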
if (needles_arr.size() > std::numeric_limits<UInt8>::max()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at most {}", name, std::to_string(needles_arr.size()), std::to_string(std::numeric_limits<UInt8>::max())); diff --git a/src/Functions/MultiSearchImpl.h b/src/Functions/MultiSearchImpl.h index fb7d56f302a..d3d1680481f 100644 --- a/src/Functions/MultiSearchImpl.h +++ b/src/Functions/MultiSearchImpl.h @@ -10,7 +10,7 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } template @@ -37,7 +37,7 @@ struct MultiSearchImpl { // For performance of Volnitsky search, it is crucial to save only one byte for pattern number. if (needles_arr.size() > std::numeric_limits<UInt8>::max()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at most {}", name, needles_arr.size(), std::to_string(std::numeric_limits<UInt8>::max())); diff --git a/src/Functions/array/arrayEnumerateExtended.h b/src/Functions/array/arrayEnumerateExtended.h index cf38afcfa5a..67c0981108f 100644 --- a/src/Functions/array/arrayEnumerateExtended.h +++ b/src/Functions/array/arrayEnumerateExtended.h @@ -18,7 +18,7 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_COLUMN; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int SIZES_OF_ARRAYS_DONT_MATCH; @@ -43,7 +43,7 @@ public: DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override { if (arguments.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at least 1.", getName(), arguments.size()); diff --git a/src/Functions/array/arrayEnumerateRanked.h b/src/Functions/array/arrayEnumerateRanked.h index 04fa305368d..ad325fe542a 100644 --- a/src/Functions/array/arrayEnumerateRanked.h +++ b/src/Functions/array/arrayEnumerateRanked.h @@ -59,7 +59,8 @@ namespace DB { namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int BAD_ARGUMENTS; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int SIZES_OF_ARRAYS_DONT_MATCH; } @@ -101,7 +102,7 @@ public: DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override { if (arguments.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at least 1.", getName(), arguments.size()); @@ -238,7 +239,7 @@ ColumnPtr FunctionArrayEnumerateRankedExtended::executeImpl( } if (offsets_by_depth.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "No arrays passed to function {}", getName()); + throw Exception(ErrorCodes::BAD_ARGUMENTS, "No arrays passed to function {}", getName()); auto res_nested = ColumnUInt32::create(); diff --git a/src/Functions/array/arrayFold.cpp b/src/Functions/array/arrayFold.cpp index 63c14f475fc..5170c9a5b5f 100644 --- a/src/Functions/array/arrayFold.cpp +++ b/src/Functions/array/arrayFold.cpp @@ -14,7 +14,7 @@ namespace ErrorCodes { extern
const int ILLEGAL_COLUMN; extern const int ILLEGAL_TYPE_OF_ARGUMENT; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int SIZES_OF_ARRAYS_DONT_MATCH; extern const int TYPE_MISMATCH; } @@ -41,7 +41,7 @@ public: void getLambdaArgumentTypes(DataTypes & arguments) const override { if (arguments.size() < 3) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} requires as arguments a lambda function, at least one array and an accumulator", getName()); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Function {} requires as arguments a lambda function, at least one array and an accumulator", getName()); DataTypes accumulator_and_array_types(arguments.size() - 1); accumulator_and_array_types[0] = arguments.back(); @@ -64,7 +64,7 @@ public: DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override { if (arguments.size() < 3) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} requires as arguments a lambda function, at least one array and an accumulator", getName()); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Function {} requires as arguments a lambda function, at least one array and an accumulator", getName()); const auto * lambda_function_type = checkAndGetDataType(arguments[0].type.get()); if (!lambda_function_type) diff --git a/src/Functions/array/arrayReduce.cpp b/src/Functions/array/arrayReduce.cpp index d47d1ae98cc..d70b8b40233 100644 --- a/src/Functions/array/arrayReduce.cpp +++ b/src/Functions/array/arrayReduce.cpp @@ -21,7 +21,7 @@ namespace DB namespace ErrorCodes { extern const int SIZES_OF_ARRAYS_DONT_MATCH; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_COLUMN; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int BAD_ARGUMENTS; @@ -73,7 +73,7 @@ DataTypePtr FunctionArrayReduce::getReturnTypeImpl(const ColumnsWithTypeAndName /// (possibly with parameters in parentheses, for example: "quantile(0.99)"). if (arguments.size() < 2) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at least 2.", getName(), arguments.size()); diff --git a/src/Functions/array/arrayZip.cpp b/src/Functions/array/arrayZip.cpp index 44c323e3fe3..6c6fff5926b 100644 --- a/src/Functions/array/arrayZip.cpp +++ b/src/Functions/array/arrayZip.cpp @@ -14,7 +14,7 @@ namespace ErrorCodes { extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int SIZES_OF_ARRAYS_DONT_MATCH; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_COLUMN; } @@ -39,7 +39,7 @@ public: DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override { if (arguments.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Function {} needs at least one argument; passed {}." 
, getName(), arguments.size()); DataTypes arguments_types; diff --git a/src/Functions/concat.cpp b/src/Functions/concat.cpp index c75a806559c..68cfcdb8d90 100644 --- a/src/Functions/concat.cpp +++ b/src/Functions/concat.cpp @@ -16,7 +16,7 @@ namespace DB { namespace ErrorCodes { -extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; +extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; } using namespace GatherUtils; @@ -48,7 +48,7 @@ public: { if (arguments.size() < 2) throw Exception( - ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at least 2", getName(), arguments.size()); @@ -225,7 +225,7 @@ public: { if (arguments.empty()) throw Exception( - ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at least 1.", getName(), arguments.size()); diff --git a/src/Functions/generateULID.cpp b/src/Functions/generateULID.cpp index 9c5c9403185..f2f2d8ae3b9 100644 --- a/src/Functions/generateULID.cpp +++ b/src/Functions/generateULID.cpp @@ -17,7 +17,7 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } class FunctionGenerateULID : public IFunction @@ -45,7 +45,7 @@ public: { if (arguments.size() > 1) throw Exception( - ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be 0 or 1.", getName(), arguments.size()); diff --git a/src/Functions/jsonMergePatch.cpp b/src/Functions/jsonMergePatch.cpp index 65946721432..a83daacdbf6 100644 --- a/src/Functions/jsonMergePatch.cpp +++ b/src/Functions/jsonMergePatch.cpp @@ -25,7 +25,7 @@ namespace ErrorCodes { extern const int BAD_ARGUMENTS; extern const int ILLEGAL_COLUMN; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -53,7 +53,7 @@ namespace DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override { if (arguments.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} requires at least one argument.", getName()); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Function {} requires at least one argument.", getName()); for (const auto & arg : arguments) if (!isString(arg.type)) diff --git a/src/Functions/nested.cpp b/src/Functions/nested.cpp index 679bb4f73d8..bdaf57d65c9 100644 --- a/src/Functions/nested.cpp +++ b/src/Functions/nested.cpp @@ -18,9 +18,10 @@ namespace DB namespace ErrorCodes { + extern const int BAD_ARGUMENTS; extern const int ILLEGAL_TYPE_OF_ARGUMENT; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; extern const int SIZES_OF_ARRAYS_DONT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; } namespace @@ -64,19 +65,19 @@ public: { size_t arguments_size = arguments.size(); if (arguments_size < 2) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be at least 2", getName(), arguments_size); Names nested_names = extractNestedNames(arguments[0].column); if (nested_names.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::BAD_ARGUMENTS, "First argument 
for function {} must be constant column with array of strings", getName()); if (nested_names.size() != arguments_size - 1) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Size of nested names array for function {} does not match arrays arguments size. Actual {}. Expected {}", getName(), nested_names.size(), diff --git a/src/Functions/now64.cpp b/src/Functions/now64.cpp index 0f1e8a04236..d6f8474c984 100644 --- a/src/Functions/now64.cpp +++ b/src/Functions/now64.cpp @@ -18,7 +18,7 @@ namespace ErrorCodes { extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int CANNOT_CLOCK_GETTIME; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; } namespace @@ -128,7 +128,7 @@ public: if (arguments.size() > 2) { - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Arguments size of function {} should be 0, or 1, or 2", getName()); + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Arguments size of function {} should be 0, or 1, or 2", getName()); } if (!arguments.empty()) { diff --git a/src/Functions/nowInBlock.cpp b/src/Functions/nowInBlock.cpp index 0d5f9c45780..74f420986c8 100644 --- a/src/Functions/nowInBlock.cpp +++ b/src/Functions/nowInBlock.cpp @@ -12,7 +12,7 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; } @@ -63,7 +63,7 @@ public: { if (arguments.size() > 1) { - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Arguments size of function {} should be 0 or 1", getName()); + throw Exception(ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Arguments size of function {} should be 0 or 1", getName()); } if (arguments.size() == 1 && !isStringOrFixedString(arguments[0].type)) { diff --git a/src/Functions/parseTimeDelta.cpp b/src/Functions/parseTimeDelta.cpp index 7743a0cb664..44eeb1a289f 100644 --- a/src/Functions/parseTimeDelta.cpp +++ b/src/Functions/parseTimeDelta.cpp @@ -11,7 +11,8 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; + extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int BAD_ARGUMENTS; } @@ -117,14 +118,14 @@ namespace { if (arguments.empty()) throw Exception( - ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be 1.", getName(), arguments.size()); if (arguments.size() > 1) throw Exception( - ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + ErrorCodes::TOO_MANY_ARGUMENTS_FOR_FUNCTION, "Number of arguments for function {} doesn't match: passed {}, should be 1.", getName(), arguments.size()); diff --git a/src/Functions/pointInPolygon.cpp b/src/Functions/pointInPolygon.cpp index 0e4467a8210..55f89b71d6f 100644 --- a/src/Functions/pointInPolygon.cpp +++ b/src/Functions/pointInPolygon.cpp @@ -37,7 +37,7 @@ namespace DB { namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int BAD_ARGUMENTS; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int ILLEGAL_COLUMN; @@ -87,7 +87,7 @@ public: { if (arguments.size() < 2) { - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Function {} requires at least 2 arguments", getName()); + throw 
Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Function {} requires at least 2 arguments", getName()); } /** We allow function invocation in one of the following forms: diff --git a/src/TableFunctions/TableFunctionValues.cpp b/src/TableFunctions/TableFunctionValues.cpp index 7b2a61c25eb..4b56fa57091 100644 --- a/src/TableFunctions/TableFunctionValues.cpp +++ b/src/TableFunctions/TableFunctionValues.cpp @@ -25,7 +25,7 @@ namespace ErrorCodes { extern const int BAD_ARGUMENTS; extern const int LOGICAL_ERROR; - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int TOO_FEW_ARGUMENTS_FOR_FUNCTION; extern const int CANNOT_EXTRACT_TABLE_STRUCTURE; } @@ -112,7 +112,7 @@ void TableFunctionValues::parseArguments(const ASTPtr & ast_function, ContextPtr ASTs & args = args_func.at(0)->children; if (args.empty()) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires at least 1 argument", getName()); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Table function '{}' requires at least 1 argument", getName()); const auto & literal = args[0]->as(); String value; From cb4f78d9d83de9ec29569652a0d4e6b826e9c0fb Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=D0=9A=D0=B8=D1=80=D0=B8=D0=BB=D0=BB=20=D0=93=D0=B0=D1=80?= =?UTF-8?q?=D0=B1=D0=B0=D1=80?= Date: Mon, 6 May 2024 13:04:28 +0300 Subject: [PATCH 077/289] Allow to create MaterializedMySQL database without connection --- .../MySQL/DatabaseMaterializedMySQL.cpp | 5 +--- .../materialized_with_ddl.py | 26 +++++++++++++++++++ .../test_materialized_mysql_database/test.py | 8 ++++++ 3 files changed, 35 insertions(+), 4 deletions(-) diff --git a/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp b/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp index d8360a24bcb..6d89cc23590 100644 --- a/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp +++ b/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp @@ -81,12 +81,9 @@ LoadTaskPtr DatabaseMaterializedMySQL::startupDatabaseAsync(AsyncLoader & async_ base->goals(), TablesLoaderBackgroundStartupPoolId, fmt::format("startup MaterializedMySQL database {}", getDatabaseName()), - [this, mode] (AsyncLoader &, const LoadJobPtr &) + [this] (AsyncLoader &, const LoadJobPtr &) { LOG_TRACE(log, "Starting MaterializeMySQL database"); - if (mode < LoadingStrictnessLevel::FORCE_ATTACH) - materialize_thread.assertMySQLAvailable(); - materialize_thread.startSynchronization(); started_up = true; }); diff --git a/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py b/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py index 57f2ccd720d..dcb2546bad3 100644 --- a/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py +++ b/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py @@ -3413,3 +3413,29 @@ def gtid_after_attach_test(clickhouse_node, mysql_node, replication): interval_seconds=1, retry_count=300, ) + + +def mysql_create_database_without_connection(clickhouse_node, mysql_node, service_name): + mysql_node.query("DROP DATABASE IF EXISTS create_without_connection") + clickhouse_node.query("DROP DATABASE IF EXISTS create_without_connection") + mysql_node.query("CREATE DATABASE create_without_connection") + mysql_node.query( + "CREATE TABLE create_without_connection.test ( `id` int(11) NOT NULL, PRIMARY KEY (`id`) ) ENGINE=InnoDB;" + ) + + clickhouse_node.cluster.pause_container(service_name) + + clickhouse_node.query( + "CREATE DATABASE create_without_connection ENGINE = 
MaterializedMySQL('{}:3306', 'create_without_connection', 'root', 'clickhouse') SETTINGS max_wait_time_when_mysql_unavailable=-1".format( + service_name + ) + ) + + clickhouse_node.cluster.unpause_container(service_name) + mysql_node.alloc_connection() + + check_query( + clickhouse_node, + "SHOW TABLES FROM create_without_connection FORMAT TSV", + "test\n", + ) diff --git a/tests/integration/test_materialized_mysql_database/test.py b/tests/integration/test_materialized_mysql_database/test.py index 57e496fe737..080a850a8c6 100644 --- a/tests/integration/test_materialized_mysql_database/test.py +++ b/tests/integration/test_materialized_mysql_database/test.py @@ -721,3 +721,11 @@ def test_binlog_client(started_cluster, started_mysql_8_0, replication): materialized_with_ddl.gtid_after_attach_test( node_db, started_mysql_8_0, replication ) + + +def test_create_database_without_mysql_connection( + started_cluster, started_mysql_8_0, clickhouse_node: ClickHouseInstance +): + materialized_with_ddl.mysql_create_database_without_connection( + clickhouse_node, started_mysql_8_0, "mysql80" + ) From 48d6c3760d3890280ce4308e9d51afe9b281232d Mon Sep 17 00:00:00 2001 From: serxa Date: Mon, 6 May 2024 12:05:37 +0000 Subject: [PATCH 078/289] workaround for `oklch()` inside canvas bug for firefox --- programs/server/dashboard.html | 50 +++++++++++++++++++++++++++++++++- 1 file changed, 49 insertions(+), 1 deletion(-) diff --git a/programs/server/dashboard.html b/programs/server/dashboard.html index 901211e8ad9..b21d4b86314 100644 --- a/programs/server/dashboard.html +++ b/programs/server/dashboard.html @@ -538,9 +538,57 @@ let params = default_params; /// Palette generation for charts function generatePalette(numColors) { + // oklch() does not work in firefox<=125 inside element so we convert it back to rgb for now. + // Based on https://github.com/color-js/color.js/blob/main/src/spaces/oklch.js + const multiplyMatrices = (A, B) => { + return [ + A[0]*B[0] + A[1]*B[1] + A[2]*B[2], + A[3]*B[0] + A[4]*B[1] + A[5]*B[2], + A[6]*B[0] + A[7]*B[1] + A[8]*B[2] + ]; + } + + const oklch2oklab = ([l, c, h]) => [ + l, + isNaN(h) ? 0 : c * Math.cos(h * Math.PI / 180), + isNaN(h) ? 0 : c * Math.sin(h * Math.PI / 180) + ] + + const srgbLinear2rgb = rgb => rgb.map(c => + Math.abs(c) > 0.0031308 ? + (c < 0 ? -1 : 1) * (1.055 * (Math.abs(c) ** (1 / 2.4)) - 0.055) : + 12.92 * c + ) + + const oklab2xyz = lab => { + const LMSg = multiplyMatrices([ + 1, 0.3963377773761749, 0.2158037573099136, + 1, -0.1055613458156586, -0.0638541728258133, + 1, -0.0894841775298119, -1.2914855480194092, + ], lab) + const LMS = LMSg.map(val => val ** 3) + return multiplyMatrices([ + 1.2268798758459243, -0.5578149944602171, 0.2813910456659647, + -0.0405757452148008, 1.1122868032803170, -0.0717110580655164, + -0.0763729366746601, -0.4214933324022432, 1.5869240198367816 + ], LMS) + } + + const xyz2rgbLinear = xyz => { + return multiplyMatrices([ + 3.2409699419045226, -1.537383177570094, -0.4986107602930034, + -0.9692436362808796, 1.8759675015077202, 0.04155505740717559, + 0.05563007969699366, -0.20397695888897652, 1.0569715142428786 + ], xyz) + } + + const oklch2rgb = lch => srgbLinear2rgb(xyz2rgbLinear(oklab2xyz(oklch2oklab(lch)))) + palette = []; for (let i = 0; i < numColors; i++) { - palette.push(`oklch(${theme != 'dark' ? 0.75 : 0.5}, 0.15, ${360 * i / numColors})`); + //palette.push(`oklch(${theme != 'dark' ? 0.75 : 0.5}, 0.15, ${360 * i / numColors})`); + let rgb = oklch2rgb([theme != 'dark' ? 
0.75 : 0.5, 0.15, 360 * i / numColors]); + palette.push(`rgb(${rgb[0] * 255}, ${rgb[1] * 255}, ${rgb[2] * 255})`); } return palette; } From 731d05491cf44d8356f1d6971883004a862fcd0d Mon Sep 17 00:00:00 2001 From: Andrey Zvonov Date: Mon, 6 May 2024 12:08:02 +0000 Subject: [PATCH 079/289] simplify estimation of number of objects in bucket --- src/Storages/StorageS3.cpp | 33 ++++++++++++++------------------- src/Storages/StorageS3.h | 1 - 2 files changed, 14 insertions(+), 20 deletions(-) diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index cb5734cfe0c..8a4e30fed1d 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -485,12 +485,15 @@ StorageS3Source::KeyWithInfoPtr StorageS3Source::DisclosedGlobIterator::next(siz size_t StorageS3Source::DisclosedGlobIterator::estimatedKeysCount() { - return pimpl->objectsCount(); -} - -bool StorageS3Source::DisclosedGlobIterator::hasMore() -{ - return pimpl->hasMore(); + if (pimpl->hasMore()) + { + /// 1000 files were listed, and we cannot make any estimation of _how many more_ there are (because we list bucket lazily); + /// If there are more objects in the bucket, limiting the number of streams is the last thing we may want to do + /// as it would lead to serious (up to times) reading performance degradation. + return std::numeric_limits::max(); + } + else + return pimpl->objectsCount(); } class StorageS3Source::KeysIterator::Impl @@ -1285,21 +1288,13 @@ void ReadFromStorageS3Step::initializePipeline(QueryPipelineBuilder & pipeline, createIterator(nullptr); size_t estimated_keys_count = iterator_wrapper->estimatedKeysCount(); - const auto glob_iter = std::dynamic_pointer_cast(iterator_wrapper); - - if (!(glob_iter && glob_iter->hasMore())) + if (estimated_keys_count > 1) + num_streams = std::min(num_streams, estimated_keys_count); + else { - if (estimated_keys_count > 1) - num_streams = std::min(num_streams, estimated_keys_count); - else - { - /// The amount of keys (zero) was probably underestimated. We will keep one stream for this particular case. - num_streams = 1; - } + /// The amount of keys (zero) was probably underestimated. We will keep one stream for this particular case. + num_streams = 1; } - /// OTHERWISE, 1000 files were listed, but we cannot make any estimation of _how many_ there are (because we list bucket lazily); - /// If there are more objects in the bucket, limiting the number of streams is the last thing we may want to do - /// as it would lead to serious (up to times) reading performance degradation. const size_t max_threads = context->getSettingsRef().max_threads; const size_t max_parsing_threads = num_streams >= max_threads ? 
1 : (max_threads / std::max(num_streams, 1ul)); diff --git a/src/Storages/StorageS3.h b/src/Storages/StorageS3.h index b841e973a9b..c8ab28fb20e 100644 --- a/src/Storages/StorageS3.h +++ b/src/Storages/StorageS3.h @@ -83,7 +83,6 @@ public: KeyWithInfoPtr next(size_t idx = 0) override; /// NOLINT size_t estimatedKeysCount() override; - bool hasMore(); private: class Impl; From 9d55bc82d6609633a135a5044f05aadeaff21755 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Mon, 6 May 2024 16:19:57 +0200 Subject: [PATCH 080/289] Revert "Revert "Do not remove server constants from GROUP BY key for secondary query."" --- src/Planner/PlannerExpressionAnalysis.cpp | 6 ++++-- .../03095_group_by_server_constants_bug.reference | 1 + .../0_stateless/03095_group_by_server_constants_bug.sql | 5 +++++ 3 files changed, 10 insertions(+), 2 deletions(-) create mode 100644 tests/queries/0_stateless/03095_group_by_server_constants_bug.reference create mode 100644 tests/queries/0_stateless/03095_group_by_server_constants_bug.sql diff --git a/src/Planner/PlannerExpressionAnalysis.cpp b/src/Planner/PlannerExpressionAnalysis.cpp index ad8db83d66c..d7fa270a643 100644 --- a/src/Planner/PlannerExpressionAnalysis.cpp +++ b/src/Planner/PlannerExpressionAnalysis.cpp @@ -85,6 +85,8 @@ std::optional analyzeAggregation(const QueryTreeNodeP bool group_by_use_nulls = planner_context->getQueryContext()->getSettingsRef().group_by_use_nulls && (query_node.isGroupByWithGroupingSets() || query_node.isGroupByWithRollup() || query_node.isGroupByWithCube()); + bool is_secondary_query = planner_context->getQueryContext()->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY; + if (query_node.hasGroupBy()) { if (query_node.isGroupByWithGroupingSets()) @@ -100,7 +102,7 @@ std::optional analyzeAggregation(const QueryTreeNodeP auto is_constant_key = grouping_set_key_node->as() != nullptr; group_by_with_constant_keys |= is_constant_key; - if (is_constant_key && !aggregates_descriptions.empty()) + if (!is_secondary_query && is_constant_key && !aggregates_descriptions.empty()) continue; auto expression_dag_nodes = actions_visitor.visit(before_aggregation_actions, grouping_set_key_node); @@ -152,7 +154,7 @@ std::optional analyzeAggregation(const QueryTreeNodeP auto is_constant_key = group_by_key_node->as() != nullptr; group_by_with_constant_keys |= is_constant_key; - if (is_constant_key && !aggregates_descriptions.empty()) + if (!is_secondary_query && is_constant_key && !aggregates_descriptions.empty()) continue; auto expression_dag_nodes = actions_visitor.visit(before_aggregation_actions, group_by_key_node); diff --git a/tests/queries/0_stateless/03095_group_by_server_constants_bug.reference b/tests/queries/0_stateless/03095_group_by_server_constants_bug.reference new file mode 100644 index 00000000000..80ab3c879bb --- /dev/null +++ b/tests/queries/0_stateless/03095_group_by_server_constants_bug.reference @@ -0,0 +1 @@ +r1 2 diff --git a/tests/queries/0_stateless/03095_group_by_server_constants_bug.sql b/tests/queries/0_stateless/03095_group_by_server_constants_bug.sql new file mode 100644 index 00000000000..9f9fda1ef62 --- /dev/null +++ b/tests/queries/0_stateless/03095_group_by_server_constants_bug.sql @@ -0,0 +1,5 @@ +SELECT serverUUID() AS s, count() FROM remote('127.0.0.{1,2}', system.one) GROUP BY s format Null; + +select getMacro('replica') as s, count() from remote('127.0.0.{1,2}', system.one) group by s; + +select uptime() as s, count() FROM remote('127.0.0.{1,2}', system.one) group by s format Null; From 
c0d2a99a9e5cb02de730fc237166c41b79d84034 Mon Sep 17 00:00:00 2001 From: Shaun Struwig <41984034+Blargian@users.noreply.github.com> Date: Mon, 6 May 2024 16:51:23 +0200 Subject: [PATCH 081/289] Update date-time-functions.md --- .../functions/date-time-functions.md | 88 +++++++++---------- 1 file changed, 44 insertions(+), 44 deletions(-) diff --git a/docs/en/sql-reference/functions/date-time-functions.md b/docs/en/sql-reference/functions/date-time-functions.md index 629b3ca9305..493cc9b7648 100644 --- a/docs/en/sql-reference/functions/date-time-functions.md +++ b/docs/en/sql-reference/functions/date-time-functions.md @@ -2564,16 +2564,16 @@ Adds a specified number of years to a date, a date with time or a string-encoded **Syntax** ```sql -addYears(date, x) +addYears(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of years to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of years to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of years to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of years to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` years. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` years. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2601,16 +2601,16 @@ Adds a specified number of quarters to a date, a date with time or a string-enco **Syntax** ```sql -addQuarters(date, x) +addQuarters(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of quarters to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of quarters to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of quarters to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of quarters to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` quarters. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` quarters. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2638,16 +2638,16 @@ Adds a specified number of months to a date, a date with time or a string-encode **Syntax** ```sql -addMonths(date, x) +addMonths(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of months to. 
[date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of months to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of months to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of months to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` months. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` months. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2675,16 +2675,16 @@ Adds a specified number of weeks to a date, a date with time or a string-encoded **Syntax** ```sql -addWeeks(date, x) +addWeeks(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of weeks to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of weeks to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of weeks to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of weeks to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` weeks. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` weeks. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2712,16 +2712,16 @@ Adds a specified number of days to a date, a date with time or a string-encoded **Syntax** ```sql -addDays(date, x) +addDays(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of days to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of days to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of days to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of days to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` days. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` days. 
[Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2749,16 +2749,16 @@ Adds a specified number of hours to a date, a date with time or a string-encoded **Syntax** ```sql -addHours(date, x) +addHours(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of hours to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of hours to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of hours to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of hours to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` hours. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` hours. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2786,16 +2786,16 @@ Adds a specified number of minutes to a date, a date with time or a string-encod **Syntax** ```sql -addMinutes(date, x) +addMinutes(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of minutes to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of minutes to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of minutes to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of minutes to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` minutes. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` minutes. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2823,16 +2823,16 @@ Adds a specified number of seconds to a date, a date with time or a string-encod **Syntax** ```sql -addSeconds(date, x) +addSeconds(date, num) ``` **Parameters** -- `date`: Date / date with time to add specified number of seconds to. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of seconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date`: Date / date with time to add specified number of seconds to. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `num`: Number of seconds to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date` plus `x` seconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date` plus `num` seconds. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2860,16 +2860,16 @@ Adds a specified number of milliseconds to a date with time or a string-encoded **Syntax** ```sql -addMilliseconds(date_time, x) +addMilliseconds(date_time, num) ``` **Parameters** -- `date_time`: Date with time to add specified number of milliseconds to. [datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of milliseconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date_time`: Date with time to add specified number of milliseconds to. [DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of milliseconds to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date_time` plus `x` milliseconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date_time` plus `num` milliseconds. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2895,16 +2895,16 @@ Adds a specified number of microseconds to a date with time or a string-encoded **Syntax** ```sql -addMicroseconds(date_time, x) +addMicroseconds(date_time, num) ``` **Parameters** -- `date_time`: Date with time to add specified number of microseconds to. [datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of microseconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date_time`: Date with time to add specified number of microseconds to. [DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md). +- `num`: Number of microseconds to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md). **Returned value** -- Returns `date_time` plus `x` microseconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md). +- Returns `date_time` plus `num` microseconds. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md). **Example** @@ -2930,16 +2930,16 @@ Adds a specified number of nanoseconds to a date with time or a string-encoded **Syntax** ```sql -addNanoseconds(date_time, x) +addNanoseconds(date_time, num) ``` **Parameters** -- `date_time`: Date with time to add specified number of nanoseconds to. [datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md), [String](../data-types/string.md). -- `x`: Number of nanoseconds to add. [(U)Int*](../data-types/int-uint.md), [float*](../data-types/float.md). +- `date_time`: Date with time to add specified number of nanoseconds to.
[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md), [String](../data-types/string.md).
+- `num`: Number of nanoseconds to add. [(U)Int*](../data-types/int-uint.md), [Float*](../data-types/float.md).
 
 **Returned value**
 
-- Returns `date_time` plus `x` nanoseconds. [date](../data-types/date.md)/[date32](../data-types/date32.md)/[datetime](../data-types/datetime.md)/[datetime64](../data-types/datetime64.md).
+- Returns `date_time` plus `num` nanoseconds. [Date](../data-types/date.md)/[Date32](../data-types/date32.md)/[DateTime](../data-types/datetime.md)/[DateTime64](../data-types/datetime64.md).
 
 **Example**

From ba4f5f9b3fe74d44295633995033c9d484b8a9c6 Mon Sep 17 00:00:00 2001
From: kssenii
Date: Mon, 6 May 2024 19:46:57 +0200
Subject: [PATCH 082/289] Fix backup of parts with projections but without
 projections in metadata

---
 src/Storages/MergeTree/MergeTreeData.cpp      | 42 +++++++++++++---
 ...145_non_loaded_projection_backup.reference |  7 +++
 .../03145_non_loaded_projection_backup.sh     | 49 +++++++++++++++++++
 3 files changed, 92 insertions(+), 6 deletions(-)
 create mode 100644 tests/queries/0_stateless/03145_non_loaded_projection_backup.reference
 create mode 100755 tests/queries/0_stateless/03145_non_loaded_projection_backup.sh

diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index 9350b24c96a..fbe79a32b8e 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -5361,20 +5361,50 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts(
                 &temp_dirs,
                 false, false);
 
-            auto projection_parts = part->getProjectionParts();
-            for (const auto & [projection_name, projection_part] : projection_parts)
+            auto backup_projection = [&](IDataPartStorage & storage, IMergeTreeDataPart & projection_part)
             {
-                projection_part->getDataPartStorage().backup(
-                    projection_part->checksums,
-                    projection_part->getFileNamesWithoutChecksums(),
+                storage.backup(
+                    projection_part.checksums,
+                    projection_part.getFileNamesWithoutChecksums(),
                     fs::path{data_path_in_backup} / part->name,
                     backup_settings,
                     read_settings,
                     make_temporary_hard_links,
                     backup_entries_from_part,
                     &temp_dirs,
-                    projection_part->is_broken,
+                    projection_part.is_broken,
                     backup_settings.allow_backup_broken_projections);
+            };
+
+            auto projection_parts = part->getProjectionParts();
+            std::string proj_suffix = ".proj";
+            std::unordered_set<String> defined_projections;
+
+            for (const auto & [projection_name, projection_part] : projection_parts)
+            {
+                defined_projections.emplace(projection_name);
+                backup_projection(projection_part->getDataPartStorage(), *projection_part);
+            }
+
+            /// It is possible that the part has a written but not loaded projection,
+            /// e.g. it is written to the parent part's checksums.txt and exists on disk,
+            /// but does not exist in the table's projections definition.
+            /// Such a part can appear if the server was restarted after DROP PROJECTION but before the old part was removed.
+            /// In this case, the old part will load only projections from metadata.
+            /// See 03145_non_loaded_projection_backup.sh.
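+            /// (Illustration: a checksums entry such as "pp.proj", like the projection
+            /// in the test added below, has stem "pp", which is then checked against
+            /// the projections defined in the metadata.)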
+ for (const auto & [name, _] : part->checksums.files) + { + auto projection_name = fs::path(name).stem().string(); + if (endsWith(name, proj_suffix) && !defined_projections.contains(projection_name)) + { + auto projection_storage = part->getDataPartStorage().getProjection(projection_name + proj_suffix); + if (projection_storage->exists("checksums.txt")) + { + auto projection_part = const_cast(*part).getProjectionPartBuilder( + projection_name, /* is_temp_projection */false).withPartFormatFromDisk().build(); + backup_projection(projection_part->getDataPartStorage(), *projection_part); + } + } } if (hold_storage_and_part_ptrs) diff --git a/tests/queries/0_stateless/03145_non_loaded_projection_backup.reference b/tests/queries/0_stateless/03145_non_loaded_projection_backup.reference new file mode 100644 index 00000000000..a11ee210e62 --- /dev/null +++ b/tests/queries/0_stateless/03145_non_loaded_projection_backup.reference @@ -0,0 +1,7 @@ +7 +Found unexpected projection directories: pp.proj +BACKUP_CREATED +RESTORED +7 +Found unexpected projection directories: pp.proj +0 diff --git a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh new file mode 100755 index 00000000000..721ed784fc2 --- /dev/null +++ b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh @@ -0,0 +1,49 @@ +#!/usr/bin/env bash + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. "$CURDIR"/../shell_config.sh + +$CLICKHOUSE_CLIENT -nm -q " +drop table if exists tp_1; +create table tp_1 (x Int32, y Int32, projection p (select x, y order by x)) engine = MergeTree order by y partition by intDiv(y, 100); +insert into tp_1 select number, number from numbers(3); + +set mutations_sync = 2; + +alter table tp_1 add projection pp (select x, count() group by x); +insert into tp_1 select number, number from numbers(4); +select count() from tp_1; + +-- Here we have a part with written projection pp +alter table tp_1 detach partition '0'; +-- Move part to detached +alter table tp_1 clear projection pp; +-- Remove projection from table metadata +alter table tp_1 drop projection pp; +-- Now, we don't load projection pp for attached part, but it is written on disk +alter table tp_1 attach partition '0'; +" + +$CLICKHOUSE_CLIENT -nm -q " +set send_logs_level='fatal'; +check table tp_1 settings check_query_single_value_result = 0;" | grep -o "Found unexpected projection directories: pp.proj" + +backup_id="$CLICKHOUSE_TEST_UNIQUE_NAME" +$CLICKHOUSE_CLIENT -q " +backup table tp_1 to Disk('backups', '$backup_id'); +" | grep -o "BACKUP_CREATED" + +$CLICKHOUSE_CLIENT -nm -q " +drop table tp_1; +restore table tp_1 from Disk('backups', '$backup_id'); +" | grep -o "RESTORED" + +$CLICKHOUSE_CLIENT -q "select count() from tp_1;" +$CLICKHOUSE_CLIENT -nm -q " +set send_logs_level='fatal'; +check table tp_1 settings check_query_single_value_result = 0;" | grep -o "Found unexpected projection directories: pp.proj" +$CLICKHOUSE_CLIENT -nm -q " +set send_logs_level='fatal'; +check table tp_1" +$CLICKHOUSE_CLIENT -q "drop table tp_1 sync" From 0b0e97917e3e4ab27a17cbf14d9e73163a20adbe Mon Sep 17 00:00:00 2001 From: alesapin Date: Mon, 6 May 2024 21:03:04 +0200 Subject: [PATCH 083/289] Do in reverse order --- src/Storages/MergeTree/MergeTreeRangeReader.cpp | 15 ++++++++------- 1 file changed, 8 insertions(+), 7 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeRangeReader.cpp 
b/src/Storages/MergeTree/MergeTreeRangeReader.cpp index eb757e1d8c7..492e4065502 100644 --- a/src/Storages/MergeTree/MergeTreeRangeReader.cpp +++ b/src/Storages/MergeTree/MergeTreeRangeReader.cpp @@ -1007,6 +1007,10 @@ MergeTreeRangeReader::ReadResult MergeTreeRangeReader::read(size_t max_rows, Mar filterColumns(columns, read_result.final_filter); } + /// If columns not empty, then apply on-fly alter conversions if any required + if (!prewhere_info || prewhere_info->perform_alter_conversions) + merge_tree_reader->performRequiredConversions(columns); + /// If some columns absent in part, then evaluate default values if (should_evaluate_missing_defaults) { @@ -1018,9 +1022,6 @@ MergeTreeRangeReader::ReadResult MergeTreeRangeReader::read(size_t max_rows, Mar merge_tree_reader->evaluateMissingDefaults(additional_columns, columns); } - /// If columns not empty, then apply on-fly alter conversions if any required - if (!prewhere_info || prewhere_info->perform_alter_conversions) - merge_tree_reader->performRequiredConversions(columns); } read_result.columns.reserve(read_result.columns.size() + columns.size()); @@ -1046,14 +1047,14 @@ MergeTreeRangeReader::ReadResult MergeTreeRangeReader::read(size_t max_rows, Mar bool should_evaluate_missing_defaults; merge_tree_reader->fillMissingColumns(columns, should_evaluate_missing_defaults, read_result.num_rows); - /// If some columns absent in part, then evaluate default values - if (should_evaluate_missing_defaults) - merge_tree_reader->evaluateMissingDefaults({}, columns); - /// If result not empty, then apply on-fly alter conversions if any required if (!prewhere_info || prewhere_info->perform_alter_conversions) merge_tree_reader->performRequiredConversions(columns); + /// If some columns absent in part, then evaluate default values + if (should_evaluate_missing_defaults) + merge_tree_reader->evaluateMissingDefaults({}, columns); + for (size_t i = 0; i < columns.size(); ++i) read_result.columns[i] = std::move(columns[i]); } From 1b7b4fc858fe7918d274691d233b69df701654fa Mon Sep 17 00:00:00 2001 From: Maxim Alexeev Date: Mon, 6 May 2024 22:08:13 +0300 Subject: [PATCH 084/289] removed unnecessary setting --- src/Core/Settings.h | 1 - src/Interpreters/HashJoin.cpp | 12 ++++++------ src/Interpreters/TableJoin.cpp | 1 - src/Interpreters/TableJoin.h | 3 --- 4 files changed, 6 insertions(+), 11 deletions(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 5dc80912ebb..7ed175d38f4 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -463,7 +463,6 @@ class IColumn; M(UInt64, partial_merge_join_rows_in_right_blocks, 65536, "Split right-hand joining data in blocks of specified size. It's a portion of data indexed by min-max values and possibly unloaded on disk.", 0) \ M(UInt64, join_on_disk_max_files_to_merge, 64, "For MergeJoin on disk set how much files it's allowed to sort simultaneously. Then this value bigger then more memory used and then less disk I/O needed. Minimum is 2.", 0) \ M(UInt64, max_rows_in_set_to_optimize_join, 0, "Maximal size of the set to filter joined tables by each other row sets before joining. 
0 - disable.", 0) \ - M(UInt64, cross_join_max_bytes_inmemory, 1000000, "Maximal bytes to complete cross join inmemory.", 0) \ \ M(Bool, compatibility_ignore_collation_in_create_table, true, "Compatibility ignore collation in create table", 0) \ \ diff --git a/src/Interpreters/HashJoin.cpp b/src/Interpreters/HashJoin.cpp index e194df4e660..52c804c261a 100644 --- a/src/Interpreters/HashJoin.cpp +++ b/src/Interpreters/HashJoin.cpp @@ -2309,6 +2309,12 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) } }; + for (const Block & compressed_block_right : data->blocks) + { + auto block_right = compressed_block_right.decompress(); + process_right_block(block_right); + } + if (tmp_stream) { tmp_stream->finishWritingAsyncSafe(); @@ -2319,12 +2325,6 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) } } - for (const Block & compressed_block_right : data->blocks) - { - auto block_right = compressed_block_right.decompress(); - process_right_block(block_right); - } - start_right_block = 0; if (rows_added > max_joined_block_rows) diff --git a/src/Interpreters/TableJoin.cpp b/src/Interpreters/TableJoin.cpp index 7ceb90704f3..1ee8ca14b2f 100644 --- a/src/Interpreters/TableJoin.cpp +++ b/src/Interpreters/TableJoin.cpp @@ -111,7 +111,6 @@ TableJoin::TableJoin(const Settings & settings, VolumePtr tmp_volume_, Temporary , cross_join_min_bytes_to_compress(settings.cross_join_min_bytes_to_compress) , max_joined_block_rows(settings.max_joined_block_size_rows) , join_algorithm(settings.join_algorithm) - , cross_join_max_bytes_inmemory(settings.cross_join_max_bytes_inmemory) , partial_merge_join_rows_in_right_blocks(settings.partial_merge_join_rows_in_right_blocks) , partial_merge_join_left_table_buffer_bytes(settings.partial_merge_join_left_table_buffer_bytes) , max_files_to_merge(settings.join_on_disk_max_files_to_merge) diff --git a/src/Interpreters/TableJoin.h b/src/Interpreters/TableJoin.h index d6920d6afbf..8e83233e54c 100644 --- a/src/Interpreters/TableJoin.h +++ b/src/Interpreters/TableJoin.h @@ -145,7 +145,6 @@ private: const UInt64 cross_join_min_bytes_to_compress = 10000; const size_t max_joined_block_rows = 0; std::vector join_algorithm; - const UInt64 cross_join_max_bytes_inmemory = 1000000; const size_t partial_merge_join_rows_in_right_blocks = 0; const size_t partial_merge_join_left_table_buffer_bytes = 0; const size_t max_files_to_merge = 0; @@ -281,8 +280,6 @@ public: bool allowParallelHashJoin() const; - UInt64 crossJoinMaxBytesInmemory() const { return cross_join_max_bytes_inmemory; } - bool joinUseNulls() const { return join_use_nulls; } UInt64 crossJoinMinRowsToCompress() const { return cross_join_min_rows_to_compress; } From 670c8c11886ee5763639bccb28cf45f74f683c05 Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Mon, 6 May 2024 21:42:25 +0200 Subject: [PATCH 085/289] fix exception --- src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp b/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp index 6b60faadf07..16646c702bf 100644 --- a/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp +++ b/src/AggregateFunctions/Combinators/AggregateFunctionArray.cpp @@ -26,7 +26,7 @@ public: DataTypes transformArguments(const DataTypes & arguments) const override { if (arguments.empty()) - throw 
Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "-Array aggregate functions require at least one argument"); + throw Exception(ErrorCodes::TOO_FEW_ARGUMENTS_FOR_FUNCTION, "Array aggregate functions require at least one argument"); DataTypes nested_arguments; for (const auto & type : arguments) From 1660a4fe867d3d8d5e2fb0167c689f936226cfde Mon Sep 17 00:00:00 2001 From: Maxim Alexeev Date: Mon, 6 May 2024 23:22:41 +0300 Subject: [PATCH 086/289] first working version --- src/Interpreters/HashJoin.cpp | 24 +++++++++++++++++++----- 1 file changed, 19 insertions(+), 5 deletions(-) diff --git a/src/Interpreters/HashJoin.cpp b/src/Interpreters/HashJoin.cpp index 52c804c261a..68186c00663 100644 --- a/src/Interpreters/HashJoin.cpp +++ b/src/Interpreters/HashJoin.cpp @@ -64,6 +64,7 @@ struct NotProcessedCrossJoin : public ExtraBlock { size_t left_position; size_t right_block; + std::unique_ptr reader; }; @@ -256,7 +257,6 @@ HashJoin::HashJoin(std::shared_ptr table_join_, const Block & right_s , instance_log_id(!instance_id_.empty() ? "(" + instance_id_ + ") " : "") , log(getLogger("HashJoin")) { - LOG_INFO(log, "KEK CONSTRUCTOR {}\n", reserve_num); LOG_TRACE(log, "{}Keys: {}, datatype: {}, kind: {}, strictness: {}, right header: {}", instance_log_id, TableJoin::formatClauses(table_join->getClauses(), true), data->type, kind, strictness, right_sample_block.dumpStructure()); @@ -830,14 +830,23 @@ bool HashJoin::addBlockToJoin(const Block & source_block_, bool check_limits) if (shrink_blocks) block_to_save = block_to_save.shrinkToFit(); + size_t max_bytes_in_join = table_join->sizeLimits().max_bytes; + size_t max_rows_in_join = table_join->sizeLimits().max_rows; + if (!table_join->sizeLimits().hasLimits()) + { + max_bytes_in_join = table_join->defaultMaxBytes(); + } - if (kind == JoinKind::Cross) + if (kind == JoinKind::Cross + && (tmp_stream || (max_bytes_in_join && getTotalByteCount() + block_to_save.allocatedBytes() >= max_bytes_in_join) + || (max_rows_in_join && getTotalRowCount() + block_to_save.rows() >= max_rows_in_join))) { if (tmp_stream == nullptr) { tmp_stream = &tmp_data->createStream(right_sample_block); } tmp_stream->write(block_to_save); + return true; } size_t total_rows = 0; @@ -2251,11 +2260,13 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) { size_t start_left_row = 0; size_t start_right_block = 0; + std::unique_ptr reader = nullptr; if (not_processed) { auto & continuation = static_cast(*not_processed); start_left_row = continuation.left_position; start_right_block = continuation.right_block; + reader = std::move(continuation.reader); not_processed.reset(); } @@ -2317,8 +2328,11 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) if (tmp_stream) { - tmp_stream->finishWritingAsyncSafe(); - auto reader = tmp_stream->getReadStream(); + if (reader == nullptr) + { + tmp_stream->finishWritingAsyncSafe(); + reader = tmp_stream->getReadStream(); + } while (auto block_right = reader->read()) { process_right_block(block_right); @@ -2330,7 +2344,7 @@ void HashJoin::joinBlockImplCross(Block & block, ExtraBlockPtr & not_processed) if (rows_added > max_joined_block_rows) { not_processed = std::make_shared( - NotProcessedCrossJoin{{block.cloneEmpty()}, left_row, block_number + 1}); + NotProcessedCrossJoin{{block.cloneEmpty()}, left_row, block_number + 1, std::move(reader)}); not_processed->block.swap(block); break; } From 3dd04e4e58585bd467fc3549200b9759886f8a88 Mon Sep 17 00:00:00 2001 From: Maxim Alexeev Date: Mon, 6 May 
2024 23:27:28 +0300 Subject: [PATCH 087/289] removed garbage --- src/Interpreters/GraceHashJoin.cpp | 1 - src/Interpreters/HashJoin.h | 9 --------- 2 files changed, 10 deletions(-) diff --git a/src/Interpreters/GraceHashJoin.cpp b/src/Interpreters/GraceHashJoin.cpp index ba51953e979..53d1f48c291 100644 --- a/src/Interpreters/GraceHashJoin.cpp +++ b/src/Interpreters/GraceHashJoin.cpp @@ -657,7 +657,6 @@ IBlocksStreamPtr GraceHashJoin::getDelayedBlocks() GraceHashJoin::InMemoryJoinPtr GraceHashJoin::makeInMemoryJoin(const String & bucket_id, size_t reserve_num) { - LOG_INFO(log, "GreaceHashJoin\n"); return std::make_unique(table_join, right_sample_block, any_take_last_row, reserve_num, bucket_id); } diff --git a/src/Interpreters/HashJoin.h b/src/Interpreters/HashJoin.h index 1eb4d0f8030..04a04b74dd0 100644 --- a/src/Interpreters/HashJoin.h +++ b/src/Interpreters/HashJoin.h @@ -415,15 +415,6 @@ public: void setMaxJoinedBlockRows(size_t value) { max_joined_block_rows = value; } - TemporaryFileStream* getStreamForCrossJoin() - { - auto streams = tmp_data->getStreams(); - assert(streams.size() <= 1); - if (streams.empty()) - return nullptr; - return streams[0]; - } - private: friend class NotJoinedHash; From d4a0325350673a89e874d4f3a5a1500044587ced Mon Sep 17 00:00:00 2001 From: Maxim Alexeev Date: Mon, 6 May 2024 23:30:27 +0300 Subject: [PATCH 088/289] added check that tmp_data is not nullptr --- src/Interpreters/HashJoin.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Interpreters/HashJoin.cpp b/src/Interpreters/HashJoin.cpp index 68186c00663..f4408271fbf 100644 --- a/src/Interpreters/HashJoin.cpp +++ b/src/Interpreters/HashJoin.cpp @@ -837,7 +837,7 @@ bool HashJoin::addBlockToJoin(const Block & source_block_, bool check_limits) max_bytes_in_join = table_join->defaultMaxBytes(); } - if (kind == JoinKind::Cross + if (kind == JoinKind::Cross && tmp_data && (tmp_stream || (max_bytes_in_join && getTotalByteCount() + block_to_save.allocatedBytes() >= max_bytes_in_join) || (max_rows_in_join && getTotalRowCount() + block_to_save.rows() >= max_rows_in_join))) { From d531e2006d9326bce2877efda9823aa880e4c8cb Mon Sep 17 00:00:00 2001 From: Maxim Alexeev Date: Tue, 7 May 2024 00:10:24 +0300 Subject: [PATCH 089/289] Deleted check of read type and added comment --- src/Interpreters/TemporaryDataOnDisk.cpp | 12 ------------ src/Interpreters/TemporaryDataOnDisk.h | 5 +---- 2 files changed, 1 insertion(+), 16 deletions(-) diff --git a/src/Interpreters/TemporaryDataOnDisk.cpp b/src/Interpreters/TemporaryDataOnDisk.cpp index e50d501f6d3..9bd0fa9e8ed 100644 --- a/src/Interpreters/TemporaryDataOnDisk.cpp +++ b/src/Interpreters/TemporaryDataOnDisk.cpp @@ -331,12 +331,6 @@ Block TemporaryFileStream::read() if (isEof()) return {}; - if (auto type = read_type.exchange(1); type == 2) - { - read_type.store(2); - throw Exception(ErrorCodes::LOGICAL_ERROR, "Different type of reading was requested earlier"); - } - if (!in_reader) { in_reader = std::make_unique(getPath(), header, getSize()); @@ -360,12 +354,6 @@ std::unique_ptr TemporaryFileStream::getReadStream() if (isEof()) return nullptr; - if (auto type = read_type.exchange(2); type == 1) - { - read_type.store(1); - throw Exception(ErrorCodes::LOGICAL_ERROR, "Different type of reading was requested earlier"); - } - return std::make_unique(getPath(), header, getSize()); } diff --git a/src/Interpreters/TemporaryDataOnDisk.h b/src/Interpreters/TemporaryDataOnDisk.h index 792988e94bd..a5141dd373e 100644 --- a/src/Interpreters/TemporaryDataOnDisk.h 
+++ b/src/Interpreters/TemporaryDataOnDisk.h
@@ -149,7 +149,7 @@ struct InputReader
 
 /*
  * Data can be written into this stream and then read.
- * After finish writing, call `finishWriting` and then `read` to read the data.
+ * After writing is finished, call `finishWriting` and then either `read` or `getReadStream` (only one of the two) to read the data.
  * Account amount of data written to disk in parent scope.
  */
 class TemporaryFileStream : boost::noncopyable
@@ -204,9 +204,6 @@ private:
 
     Stat stat;
 
-    /// 0 - means that we haven't requested any read, 1 - read from function TemporaryFileStream::read, 2 -
-    std::atomic_char read_type{0};
-
     mutable std::mutex finish_writing;
 
    std::atomic_bool writing_finished{false};

From 9fcb5d2ebfb3e2105b5d6171a1a53ff75c0023f4 Mon Sep 17 00:00:00 2001
From: Yohann Jardin
Date: Mon, 6 May 2024 23:44:27 +0200
Subject: [PATCH 090/289] Move ErrorCodes inside DB namespace

---
 .../AggregateFunctionMannWhitney.cpp          | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp b/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp
index d185058dbd0..8434f11eae6 100644
--- a/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp
+++ b/src/AggregateFunctions/AggregateFunctionMannWhitney.cpp
@@ -17,6 +17,11 @@
 #include
 
+namespace DB
+{
+
+struct Settings;
+
 namespace ErrorCodes
 {
     extern const int NOT_IMPLEMENTED;
@@ -25,11 +30,6 @@ namespace ErrorCodes
     extern const int BAD_ARGUMENTS;
 }
 
-namespace DB
-{
-
-struct Settings;
-
 namespace
 {

From 4703eb943b9586be7cab2429a170d9cf9131558f Mon Sep 17 00:00:00 2001
From: Yohann Jardin
Date: Mon, 6 May 2024 23:59:59 +0200
Subject: [PATCH 091/289] Move ErrorCodes inside DB namespace

---
 src/AggregateFunctions/AggregateFunctionWelchTTest.cpp | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp b/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp
index 7f1c4861fbc..7efd6154227 100644
--- a/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp
+++ b/src/AggregateFunctions/AggregateFunctionWelchTTest.cpp
@@ -4,16 +4,16 @@
 #include
 
+namespace DB
+{
+struct Settings;
+
 namespace ErrorCodes
 {
     extern const int BAD_ARGUMENTS;
     extern const int TOO_MANY_ARGUMENTS_FOR_FUNCTION;
 }
 
-namespace DB
-{
-struct Settings;
-
 namespace
 {

From d14fc62d4d4b597435e482f60a2f7c83412e53cc Mon Sep 17 00:00:00 2001
From: Michael Kolupaev
Date: Fri, 29 Mar 2024 08:59:07 +0000
Subject: [PATCH 092/289] Avoid crashing on column type mismatch in a few
 dozen places

---
 src/Columns/ColumnArray.cpp                   |  2 +-
 src/Columns/ColumnLowCardinality.cpp          |  2 +-
 src/Columns/ColumnUnique.h                    |  4 +-
 src/Columns/FilterDescription.cpp             |  4 +-
 src/Columns/IColumn.h                         |  8 +++-
 src/Columns/MaskOperations.cpp                |  4 +-
 src/Common/ColumnsHashing.h                   | 12 +++---
 src/Common/ColumnsHashingImpl.h               |  2 +-
 src/Core/DecimalComparison.h                  | 16 ++++----
 src/DataTypes/ObjectUtils.cpp                 |  2 +-
 .../Serializations/SerializationBool.cpp      |  4 +-
 .../Serializations/SerializationInterval.cpp  |  2 +-
 .../SerializationLowCardinality.cpp           |  2 +-
 .../HierarchyDictionariesUtils.cpp            |  8 ++--
 src/Formats/insertNullAsDefaultIfNeeded.cpp   | 40 +++++++++----------
 src/Functions/FunctionBase64Conversion.h      |  4 +-
 src/Functions/FunctionBinaryArithmetic.h      | 20 +++++-----
 src/Functions/FunctionHelpers.cpp             | 10 ++---
 src/Functions/FunctionHelpers.h               | 25 +++++++++++-
 src/Functions/FunctionUnixTimestamp64.h       |  2 +-
 src/Functions/FunctionsBitmap.h               |  4 +-
 src/Functions/FunctionsCodingIP.cpp           |  4
+- src/Functions/FunctionsConversion.cpp | 2 +- src/Functions/FunctionsRound.h | 18 ++++----- src/Functions/FunctionsStringHash.h | 12 +++--- src/Functions/Kusto/KqlArraySort.cpp | 4 +- src/Functions/MultiMatchAllIndicesImpl.h | 4 +- src/Functions/MultiMatchAnyImpl.h | 4 +- src/Functions/MultiSearchAllPositionsImpl.h | 4 +- src/Functions/MultiSearchFirstIndexImpl.h | 4 +- src/Functions/MultiSearchFirstPositionImpl.h | 4 +- src/Functions/MultiSearchImpl.h | 4 +- .../URL/FirstSignificantSubdomainCustomImpl.h | 2 +- src/Functions/array/FunctionArrayMapped.h | 2 +- src/Functions/array/arrayCompact.cpp | 2 +- src/Functions/array/arrayDistinct.cpp | 8 ++-- src/Functions/array/arrayElement.cpp | 6 +-- src/Functions/array/arrayEnumerateExtended.h | 2 +- src/Functions/array/arrayIndex.h | 10 ++--- src/Functions/array/arrayJaccardIndex.cpp | 8 ++-- src/Functions/array/arrayUniq.cpp | 2 +- src/Functions/array/emptyArrayToSingle.cpp | 2 +- src/Functions/array/range.cpp | 6 +-- src/Functions/arrayStringConcat.cpp | 2 +- src/Functions/assumeNotNull.cpp | 2 +- src/Functions/coalesce.cpp | 10 ++--- src/Functions/fromModifiedJulianDay.cpp | 4 +- src/Functions/grouping.h | 4 +- src/Functions/hasColumnInTable.cpp | 4 +- src/Functions/if.cpp | 18 ++++----- src/Functions/isNotNull.cpp | 14 +++---- src/Functions/isNull.cpp | 14 +++---- src/Functions/minSampleSize.cpp | 8 ++-- src/Functions/multiIf.cpp | 2 +- src/Functions/readWkt.cpp | 4 +- src/Functions/repeat.cpp | 8 ++-- src/Functions/seriesOutliersDetectTukey.cpp | 6 +-- src/Functions/seriesPeriodDetectFFT.cpp | 6 +-- src/Functions/space.cpp | 6 +-- src/Functions/toStartOfInterval.cpp | 6 +-- src/Functions/ztest.cpp | 12 +++--- src/Interpreters/BloomFilterHash.h | 2 +- src/Interpreters/HashJoin.cpp | 2 +- src/Interpreters/InterpreterCheckQuery.cpp | 6 +-- src/Interpreters/JoinUtils.cpp | 20 +++++----- src/Interpreters/MergeJoin.cpp | 8 ++-- src/Interpreters/NullableUtils.cpp | 4 +- src/Interpreters/SetVariants.cpp | 2 +- src/Interpreters/SetVariants.h | 2 +- .../Transforms/CheckConstraintsTransform.cpp | 2 +- .../Transforms/MergeJoinTransform.cpp | 8 ++-- src/Processors/Transforms/WindowTransform.cpp | 2 +- src/Storages/MergeTree/MergeTreeIndexSet.cpp | 2 +- 73 files changed, 253 insertions(+), 228 deletions(-) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index 7b268b80116..8d5c246c48c 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -1283,7 +1283,7 @@ ColumnPtr ColumnArray::replicateTuple(const Offsets & replicate_offsets) const size_t ColumnArray::getNumberOfDimensions() const { - const auto * nested_array = checkAndGetColumn(*data); + const auto * nested_array = checkAndGetColumn(&*data); if (!nested_array) return 1; return 1 + nested_array->getNumberOfDimensions(); /// Every modern C++ compiler optimizes tail recursion. 
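The `IColumn.h` hunk above is the core of this patch: the overload of `checkAndGetColumn` that takes a reference now returns a reference and throws `LOGICAL_ERROR` on a type mismatch, instead of returning a possibly-null pointer, while the overload that takes a pointer keeps returning nullptr. A minimal sketch of the intended call pattern (the two helper functions are illustrative, not part of the patch):

```cpp
#include <Columns/ColumnNullable.h>
#include <Columns/IColumn.h>

using namespace DB;

/// A mismatch is an expected case: pass a pointer and branch on nullptr.
bool isNullableColumn(const IColumn & column)
{
    return checkAndGetColumn<ColumnNullable>(&column) != nullptr;
}

/// A mismatch would be a logic bug: pass a reference and let it throw
/// LOGICAL_ERROR, where the old pattern dereferenced an unchecked pointer.
const NullMap & getNullMap(const IColumn & column)
{
    return checkAndGetColumn<ColumnNullable>(column).getNullMapData();
}
```

The dozens of mechanical hunks below fall out of this split: call sites that genuinely branch keep pointer semantics (hence the recurring `*column` to `&*column` rewrites), while call sites that used to dereference the result unconditionally switch to the reference form.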
diff --git a/src/Columns/ColumnLowCardinality.cpp b/src/Columns/ColumnLowCardinality.cpp index a3696c78669..a032c2b25b7 100644 --- a/src/Columns/ColumnLowCardinality.cpp +++ b/src/Columns/ColumnLowCardinality.cpp @@ -903,7 +903,7 @@ ColumnPtr ColumnLowCardinality::cloneWithDefaultOnNull() const bool isColumnLowCardinalityNullable(const IColumn & column) { - if (const auto * lc_column = checkAndGetColumn(column)) + if (const auto * lc_column = checkAndGetColumn(&column)) return lc_column->nestedIsNullable(); return false; } diff --git a/src/Columns/ColumnUnique.h b/src/Columns/ColumnUnique.h index a8873140817..0311efd4c83 100644 --- a/src/Columns/ColumnUnique.h +++ b/src/Columns/ColumnUnique.h @@ -376,7 +376,7 @@ size_t ColumnUnique::uniqueInsertFrom(const IColumn & src, size_t n) if (is_nullable && src.isNullAt(n)) return getNullValueIndex(); - if (const auto * nullable = checkAndGetColumn(src)) + if (const auto * nullable = checkAndGetColumn(&src)) return uniqueInsertFrom(nullable->getNestedColumn(), n); auto ref = src.getDataAt(n); @@ -569,7 +569,7 @@ MutableColumnPtr ColumnUnique::uniqueInsertRangeImpl( return nullptr; }; - if (const auto * nullable_column = checkAndGetColumn(src)) + if (const auto * nullable_column = checkAndGetColumn(&src)) { src_column = typeid_cast(&nullable_column->getNestedColumn()); null_map = &nullable_column->getNullMapData(); diff --git a/src/Columns/FilterDescription.cpp b/src/Columns/FilterDescription.cpp index 62d2babe17a..56c99a5b49c 100644 --- a/src/Columns/FilterDescription.cpp +++ b/src/Columns/FilterDescription.cpp @@ -32,7 +32,7 @@ ConstantFilterDescription::ConstantFilterDescription(const IColumn & column) if (!typeid_cast(column_nested.get())) { - const ColumnNullable * column_nested_nullable = checkAndGetColumn(*column_nested); + const ColumnNullable * column_nested_nullable = checkAndGetColumn(&*column_nested); if (!column_nested_nullable || !typeid_cast(&column_nested_nullable->getNestedColumn())) { throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_COLUMN_FOR_FILTER, @@ -66,7 +66,7 @@ FilterDescription::FilterDescription(const IColumn & column_) return; } - if (const auto * nullable_column = checkAndGetColumn(column)) + if (const auto * nullable_column = checkAndGetColumn(&column)) { ColumnPtr nested_column = nullable_column->getNestedColumnPtr(); MutableColumnPtr mutable_holder = IColumn::mutate(std::move(nested_column)); diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h index cea8d7c9f55..cf2693e008c 100644 --- a/src/Columns/IColumn.h +++ b/src/Columns/IColumn.h @@ -640,12 +640,16 @@ template <> struct IsMutableColumns<> { static const bool value = true; }; +/// Throws LOGICAL_ERROR if the type doesn't match. template -const Type * checkAndGetColumn(const IColumn & column) +const Type & checkAndGetColumn(const IColumn & column) { - return typeid_cast(&column); + return typeid_cast(column); } +/// Returns nullptr if the type doesn't match. +/// If you're going to dereference the returned pointer without checking for null, use the +/// `const IColumn &` overload above instead. template const Type * checkAndGetColumn(const IColumn * column) { diff --git a/src/Columns/MaskOperations.cpp b/src/Columns/MaskOperations.cpp index 8f5299cf6e8..2c54a416850 100644 --- a/src/Columns/MaskOperations.cpp +++ b/src/Columns/MaskOperations.cpp @@ -205,10 +205,10 @@ static MaskInfo extractMaskImpl( auto column = col->convertToFullColumnIfLowCardinality(); /// Special implementation for Null and Const columns. 
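    /// (A pointer argument is used in checks like the one below so that a mismatch
    /// yields nullptr for the boolean test instead of a throw from the new reference overload.)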
- if (column->onlyNull() || checkAndGetColumn(*column)) + if (column->onlyNull() || checkAndGetColumn(&*column)) return extractMaskFromConstOrNull(mask, column, null_value, nulls); - if (const auto * nullable_column = checkAndGetColumn(*column)) + if (const auto * nullable_column = checkAndGetColumn(&*column)) { const PaddedPODArray & null_map = nullable_column->getNullMapData(); return extractMaskImpl(mask, nullable_column->getNestedColumnPtr(), null_value, &null_map, nulls); diff --git a/src/Common/ColumnsHashing.h b/src/Common/ColumnsHashing.h index 25d2ddc684d..bd3880eb83b 100644 --- a/src/Common/ColumnsHashing.h +++ b/src/Common/ColumnsHashing.h @@ -44,8 +44,8 @@ struct HashMethodOneNumber { if constexpr (nullable) { - const auto * null_column = checkAndGetColumn(key_columns[0]); - vec = null_column->getNestedColumnPtr()->getRawData().data(); + const auto & null_column = checkAndGetColumn(*key_columns[0]); + vec = null_column.getNestedColumnPtr()->getRawData().data(); } else { @@ -57,8 +57,8 @@ struct HashMethodOneNumber { if constexpr (nullable) { - const auto * null_column = checkAndGetColumn(column); - vec = null_column->getNestedColumnPtr()->getRawData().data(); + const auto & null_column = checkAndGetColumn(*column); + vec = null_column.getNestedColumnPtr()->getRawData().data(); } else { @@ -105,7 +105,7 @@ struct HashMethodString const IColumn * column; if constexpr (nullable) { - column = checkAndGetColumn(key_columns[0])->getNestedColumnPtr().get(); + column = checkAndGetColumn(*key_columns[0]).getNestedColumnPtr().get(); } else { @@ -153,7 +153,7 @@ struct HashMethodFixedString const IColumn * column; if constexpr (nullable) { - column = checkAndGetColumn(key_columns[0])->getNestedColumnPtr().get(); + column = checkAndGetColumn(*key_columns[0]).getNestedColumnPtr().get(); } else { diff --git a/src/Common/ColumnsHashingImpl.h b/src/Common/ColumnsHashingImpl.h index 6b3cc24d870..f74a56292ae 100644 --- a/src/Common/ColumnsHashingImpl.h +++ b/src/Common/ColumnsHashingImpl.h @@ -305,7 +305,7 @@ protected: } if constexpr (nullable) - null_map = &checkAndGetColumn(column)->getNullMapColumn(); + null_map = &checkAndGetColumn(*column).getNullMapColumn(); } template diff --git a/src/Core/DecimalComparison.h b/src/Core/DecimalComparison.h index 08569aa534c..63817e77805 100644 --- a/src/Core/DecimalComparison.h +++ b/src/Core/DecimalComparison.h @@ -170,11 +170,11 @@ private: if (c0_is_const && c1_is_const) { - const ColumnConst * c0_const = checkAndGetColumnConst(c0.get()); - const ColumnConst * c1_const = checkAndGetColumnConst(c1.get()); + const ColumnConst & c0_const = checkAndGetColumnConst(*c0); + const ColumnConst & c1_const = checkAndGetColumnConst(*c1); - A a = c0_const->template getValue(); - B b = c1_const->template getValue(); + A a = c0_const.template getValue(); + B b = c1_const.template getValue(); UInt8 res = apply(a, b, scale); return DataTypeUInt8().createColumnConst(c0->size(), toField(res)); } @@ -184,8 +184,8 @@ private: if (c0_is_const) { - const ColumnConst * c0_const = checkAndGetColumnConst(c0.get()); - A a = c0_const->template getValue(); + const ColumnConst & c0_const = checkAndGetColumnConst(*c0); + A a = c0_const.template getValue(); if (const ColVecB * c1_vec = checkAndGetColumn(c1.get())) constantVector(a, c1_vec->getData(), vec_res, scale); else @@ -193,8 +193,8 @@ private: } else if (c1_is_const) { - const ColumnConst * c1_const = checkAndGetColumnConst(c1.get()); - B b = c1_const->template getValue(); + const ColumnConst & c1_const = 
checkAndGetColumnConst(*c1); + B b = c1_const.template getValue(); if (const ColVecA * c0_vec = checkAndGetColumn(c0.get())) vectorConstant(c0_vec->getData(), b, vec_res, scale); else diff --git a/src/DataTypes/ObjectUtils.cpp b/src/DataTypes/ObjectUtils.cpp index 99cf092e6cd..7c671fcf44f 100644 --- a/src/DataTypes/ObjectUtils.cpp +++ b/src/DataTypes/ObjectUtils.cpp @@ -47,7 +47,7 @@ size_t getNumberOfDimensions(const IDataType & type) size_t getNumberOfDimensions(const IColumn & column) { - if (const auto * column_array = checkAndGetColumn(column)) + if (const auto * column_array = checkAndGetColumn(&column)) return column_array->getNumberOfDimensions(); return 0; } diff --git a/src/DataTypes/Serializations/SerializationBool.cpp b/src/DataTypes/Serializations/SerializationBool.cpp index d6a74e5cb8f..b63f25ddc35 100644 --- a/src/DataTypes/Serializations/SerializationBool.cpp +++ b/src/DataTypes/Serializations/SerializationBool.cpp @@ -28,7 +28,7 @@ constexpr char str_false[6] = "false"; const ColumnUInt8 * checkAndGetSerializeColumnType(const IColumn & column) { const auto * col = checkAndGetColumn(&column); - if (!checkAndGetColumn(&column)) + if (!col) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Bool type can only serialize columns of type UInt8.{}", column.getName()); return col; } @@ -36,7 +36,7 @@ const ColumnUInt8 * checkAndGetSerializeColumnType(const IColumn & column) ColumnUInt8 * checkAndGetDeserializeColumnType(IColumn & column) { auto * col = typeid_cast(&column); - if (!checkAndGetColumn(&column)) + if (!col) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Bool type can only deserialize columns of type UInt8.{}", column.getName()); return col; diff --git a/src/DataTypes/Serializations/SerializationInterval.cpp b/src/DataTypes/Serializations/SerializationInterval.cpp index 59086d8aef3..c4ef34b4325 100644 --- a/src/DataTypes/Serializations/SerializationInterval.cpp +++ b/src/DataTypes/Serializations/SerializationInterval.cpp @@ -17,7 +17,7 @@ namespace ErrorCodes void SerializationKustoInterval::serializeText( const IColumn & column, const size_t row, WriteBuffer & ostr, const FormatSettings &) const { - const auto * interval_column = checkAndGetColumn(column); + const auto * interval_column = checkAndGetColumn(&column); if (!interval_column) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Expected column of underlying type of Interval"); diff --git a/src/DataTypes/Serializations/SerializationLowCardinality.cpp b/src/DataTypes/Serializations/SerializationLowCardinality.cpp index 9efe05042ed..2d2be195098 100644 --- a/src/DataTypes/Serializations/SerializationLowCardinality.cpp +++ b/src/DataTypes/Serializations/SerializationLowCardinality.cpp @@ -477,7 +477,7 @@ void SerializationLowCardinality::serializeBinaryBulkWithMultipleStreams( settings.low_cardinality_max_dictionary_size); } - if (const auto * nullable_keys = checkAndGetColumn(*keys)) + if (const auto * nullable_keys = checkAndGetColumn(&*keys)) keys = nullable_keys->getNestedColumnPtr(); bool need_additional_keys = !keys->empty(); diff --git a/src/Dictionaries/HierarchyDictionariesUtils.cpp b/src/Dictionaries/HierarchyDictionariesUtils.cpp index fd59a0c37db..e1119982a34 100644 --- a/src/Dictionaries/HierarchyDictionariesUtils.cpp +++ b/src/Dictionaries/HierarchyDictionariesUtils.cpp @@ -95,7 +95,7 @@ namespace parent_key_column_non_null = parent_key_column_typed->getNestedColumnPtr(); } - const auto * parent_key_column_typed = checkAndGetColumn>(*parent_key_column_non_null); + const auto * parent_key_column_typed = 
checkAndGetColumn>(&*parent_key_column_non_null); if (!parent_key_column_typed) throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Parent key column should be UInt64. Actual {}", @@ -166,7 +166,7 @@ ColumnPtr getKeysHierarchyDefaultImplementation( valid_keys = 0; key_column = key_column->convertToFullColumnIfConst(); - const auto * key_column_typed = checkAndGetColumn>(*key_column); + const auto * key_column_typed = checkAndGetColumn>(&*key_column); if (!key_column_typed) throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Key column should be UInt64"); @@ -224,11 +224,11 @@ ColumnUInt8::Ptr getKeysIsInHierarchyDefaultImplementation( key_column = key_column->convertToFullColumnIfConst(); in_key_column = in_key_column->convertToFullColumnIfConst(); - const auto * key_column_typed = checkAndGetColumn>(*key_column); + const auto * key_column_typed = checkAndGetColumn>(&*key_column); if (!key_column_typed) throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Key column should be UInt64"); - const auto * in_key_column_typed = checkAndGetColumn>(*in_key_column); + const auto * in_key_column_typed = checkAndGetColumn>(&*in_key_column); if (!in_key_column_typed) throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "Key column should be UInt64"); diff --git a/src/Formats/insertNullAsDefaultIfNeeded.cpp b/src/Formats/insertNullAsDefaultIfNeeded.cpp index c42b8c54d73..ff40d036fb5 100644 --- a/src/Formats/insertNullAsDefaultIfNeeded.cpp +++ b/src/Formats/insertNullAsDefaultIfNeeded.cpp @@ -19,45 +19,45 @@ bool insertNullAsDefaultIfNeeded(ColumnWithTypeAndName & input_column, const Col if (isArray(input_column.type) && isArray(header_column.type)) { ColumnWithTypeAndName nested_input_column; - const auto * array_input_column = checkAndGetColumn(input_column.column.get()); - nested_input_column.column = array_input_column->getDataPtr(); + const auto & array_input_column = checkAndGetColumn(*input_column.column); + nested_input_column.column = array_input_column.getDataPtr(); nested_input_column.type = checkAndGetDataType(input_column.type.get())->getNestedType(); ColumnWithTypeAndName nested_header_column; - nested_header_column.column = checkAndGetColumn(header_column.column.get())->getDataPtr(); + nested_header_column.column = checkAndGetColumn(*header_column.column).getDataPtr(); nested_header_column.type = checkAndGetDataType(header_column.type.get())->getNestedType(); if (!insertNullAsDefaultIfNeeded(nested_input_column, nested_header_column, 0, nullptr)) return false; - input_column.column = ColumnArray::create(nested_input_column.column, array_input_column->getOffsetsPtr()); + input_column.column = ColumnArray::create(nested_input_column.column, array_input_column.getOffsetsPtr()); input_column.type = std::make_shared(std::move(nested_input_column.type)); return true; } if (isTuple(input_column.type) && isTuple(header_column.type)) { - const auto * tuple_input_column = checkAndGetColumn(input_column.column.get()); - const auto * tuple_input_type = checkAndGetDataType(input_column.type.get()); - const auto * tuple_header_column = checkAndGetColumn(header_column.column.get()); - const auto * tuple_header_type = checkAndGetDataType(header_column.type.get()); + const auto & tuple_input_column = checkAndGetColumn(*input_column.column); + const auto & tuple_input_type = checkAndGetDataType(*input_column.type); + const auto & tuple_header_column = checkAndGetColumn(*header_column.column); + const auto & tuple_header_type = checkAndGetDataType(*header_column.type); - if (tuple_input_type->getElements().size() != 
tuple_header_type->getElements().size()) + if (tuple_input_type.getElements().size() != tuple_header_type.getElements().size()) return false; Columns nested_input_columns; - nested_input_columns.reserve(tuple_input_type->getElements().size()); + nested_input_columns.reserve(tuple_input_type.getElements().size()); DataTypes nested_input_types; - nested_input_types.reserve(tuple_input_type->getElements().size()); + nested_input_types.reserve(tuple_input_type.getElements().size()); bool changed = false; - for (size_t i = 0; i != tuple_input_type->getElements().size(); ++i) + for (size_t i = 0; i != tuple_input_type.getElements().size(); ++i) { ColumnWithTypeAndName nested_input_column; - nested_input_column.column = tuple_input_column->getColumnPtr(i); - nested_input_column.type = tuple_input_type->getElement(i); + nested_input_column.column = tuple_input_column.getColumnPtr(i); + nested_input_column.type = tuple_input_type.getElement(i); ColumnWithTypeAndName nested_header_column; - nested_header_column.column = tuple_header_column->getColumnPtr(i); - nested_header_column.type = tuple_header_type->getElement(i); + nested_header_column.column = tuple_header_column.getColumnPtr(i); + nested_header_column.type = tuple_header_type.getElement(i); changed |= insertNullAsDefaultIfNeeded(nested_input_column, nested_header_column, 0, nullptr); nested_input_columns.push_back(std::move(nested_input_column.column)); nested_input_types.push_back(std::move(nested_input_column.type)); @@ -74,12 +74,12 @@ bool insertNullAsDefaultIfNeeded(ColumnWithTypeAndName & input_column, const Col if (isMap(input_column.type) && isMap(header_column.type)) { ColumnWithTypeAndName nested_input_column; - nested_input_column.column = checkAndGetColumn(input_column.column.get())->getNestedColumnPtr(); - nested_input_column.type = checkAndGetDataType(input_column.type.get())->getNestedType(); + nested_input_column.column = checkAndGetColumn(*input_column.column).getNestedColumnPtr(); + nested_input_column.type = checkAndGetDataType(*input_column.type).getNestedType(); ColumnWithTypeAndName nested_header_column; - nested_header_column.column = checkAndGetColumn(header_column.column.get())->getNestedColumnPtr(); - nested_header_column.type = checkAndGetDataType(header_column.type.get())->getNestedType(); + nested_header_column.column = checkAndGetColumn(*header_column.column).getNestedColumnPtr(); + nested_header_column.type = checkAndGetDataType(*header_column.type).getNestedType(); if (!insertNullAsDefaultIfNeeded(nested_input_column, nested_header_column, 0, nullptr)) return false; diff --git a/src/Functions/FunctionBase64Conversion.h b/src/Functions/FunctionBase64Conversion.h index 979c589c64b..3906563a254 100644 --- a/src/Functions/FunctionBase64Conversion.h +++ b/src/Functions/FunctionBase64Conversion.h @@ -111,9 +111,9 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { const auto & input_column = arguments[0].column; - if (const auto * src_column_as_fixed_string = checkAndGetColumn(*input_column)) + if (const auto * src_column_as_fixed_string = checkAndGetColumn(&*input_column)) return execute(*src_column_as_fixed_string, input_rows_count); - else if (const auto * src_column_as_string = checkAndGetColumn(*input_column)) + else if (const auto * src_column_as_string = checkAndGetColumn(&*input_column)) return execute(*src_column_as_string, input_rows_count); throw Exception( diff --git a/src/Functions/FunctionBinaryArithmetic.h 
b/src/Functions/FunctionBinaryArithmetic.h index 89ff63995b1..8ac602faed9 100644 --- a/src/Functions/FunctionBinaryArithmetic.h +++ b/src/Functions/FunctionBinaryArithmetic.h @@ -1767,8 +1767,8 @@ public: { if (const auto * col_right_const = checkAndGetColumnConst(col_right_raw)) { - const auto * col_left = checkAndGetColumn(col_left_const->getDataColumn()); - const auto * col_right = checkAndGetColumn(col_right_const->getDataColumn()); + const auto * col_left = &checkAndGetColumn(col_left_const->getDataColumn()); + const auto * col_right = &checkAndGetColumn(col_right_const->getDataColumn()); if (col_left->getN() != col_right->getN()) return nullptr; @@ -1805,11 +1805,11 @@ public: const auto * col_left = is_left_column_const ? checkAndGetColumn( - checkAndGetColumnConst(col_left_raw)->getDataColumn()) + &checkAndGetColumnConst(col_left_raw)->getDataColumn()) : checkAndGetColumn(col_left_raw); const auto * col_right = is_right_column_const ? checkAndGetColumn( - checkAndGetColumnConst(col_right_raw)->getDataColumn()) + &checkAndGetColumnConst(col_right_raw)->getDataColumn()) : checkAndGetColumn(col_right_raw); if (col_left && col_right) @@ -1881,8 +1881,8 @@ public: { if (const auto * col_right_const = checkAndGetColumnConst(col_right_raw)) { - const auto * col_left = checkAndGetColumn(col_left_const->getDataColumn()); - const auto * col_right = checkAndGetColumn(col_right_const->getDataColumn()); + const auto * col_left = &checkAndGetColumn(col_left_const->getDataColumn()); + const auto * col_right = &checkAndGetColumn(col_right_const->getDataColumn()); std::string_view a = col_left->getDataAt(0).toView(); std::string_view b = col_right->getDataAt(0).toView(); @@ -1897,10 +1897,10 @@ public: const bool is_right_column_const = checkAndGetColumnConst(col_right_raw) != nullptr; const auto * col_left = is_left_column_const - ? checkAndGetColumn(checkAndGetColumnConst(col_left_raw)->getDataColumn()) + ? &checkAndGetColumn(checkAndGetColumnConst(col_left_raw)->getDataColumn()) : checkAndGetColumn(col_left_raw); const auto * col_right = is_right_column_const - ? checkAndGetColumn(checkAndGetColumnConst(col_right_raw)->getDataColumn()) + ? &checkAndGetColumn(checkAndGetColumnConst(col_right_raw)->getDataColumn()) : checkAndGetColumn(col_right_raw); if (col_left && col_right) @@ -1948,7 +1948,7 @@ ColumnPtr executeStringInteger(const ColumnsWithTypeAndName & arguments, const A const ColumnConst * const col_left_const = checkAndGetColumnConst(col_left_raw); - const auto * col_left = col_left_const ? checkAndGetColumn(col_left_const->getDataColumn()) + const auto * col_left = col_left_const ? &checkAndGetColumn(col_left_const->getDataColumn()) : checkAndGetColumn(col_left_raw); if (!col_left) @@ -2231,7 +2231,7 @@ ColumnPtr executeStringInteger(const ColumnsWithTypeAndName & arguments, const A bool is_const = checkColumnConst(right_argument.column.get()); const ColumnNullable * nullable_column = is_const ? 
checkAndGetColumnConstData(right_argument.column.get()) - : checkAndGetColumn(*right_argument.column); + : checkAndGetColumn(right_argument.column.get()); const auto & null_bytemap = nullable_column->getNullMapData(); auto res = executeImpl2(createBlockWithNestedColumns(arguments), removeNullable(result_type), input_rows_count, &null_bytemap); diff --git a/src/Functions/FunctionHelpers.cpp b/src/Functions/FunctionHelpers.cpp index ce83a489a3d..048a601de81 100644 --- a/src/Functions/FunctionHelpers.cpp +++ b/src/Functions/FunctionHelpers.cpp @@ -58,14 +58,14 @@ ColumnWithTypeAndName columnGetNested(const ColumnWithTypeAndName & col) { return ColumnWithTypeAndName{nullptr, nested_type, col.name}; } - else if (const auto * nullable = checkAndGetColumn(*col.column)) + else if (const auto * nullable = checkAndGetColumn(&*col.column)) { const auto & nested_col = nullable->getNestedColumnPtr(); return ColumnWithTypeAndName{nested_col, nested_type, col.name}; } - else if (const auto * const_column = checkAndGetColumn(*col.column)) + else if (const auto * const_column = checkAndGetColumn(&*col.column)) { - const auto * nullable_column = checkAndGetColumn(const_column->getDataColumn()); + const auto * nullable_column = checkAndGetColumn(&const_column->getDataColumn()); ColumnPtr nullable_res; if (nullable_column) @@ -226,7 +226,7 @@ ColumnPtr wrapInNullable(const ColumnPtr & src, const ColumnsWithTypeAndName & a if (src->onlyNull()) return src; - else if (const auto * nullable = checkAndGetColumn(*src)) + else if (const auto * nullable = checkAndGetColumn(&*src)) { src_not_nullable = nullable->getNestedColumnPtr(); result_null_map_column = nullable->getNullMapColumnPtr(); @@ -247,7 +247,7 @@ ColumnPtr wrapInNullable(const ColumnPtr & src, const ColumnsWithTypeAndName & a if (isColumnConst(*elem.column)) continue; - if (const auto * nullable = checkAndGetColumn(*elem.column)) + if (const auto * nullable = checkAndGetColumn(&*elem.column)) { const ColumnPtr & null_map_column = nullable->getNullMapColumnPtr(); if (!result_null_map_column) diff --git a/src/Functions/FunctionHelpers.h b/src/Functions/FunctionHelpers.h index 9f44d3e95c2..89b224e79ef 100644 --- a/src/Functions/FunctionHelpers.h +++ b/src/Functions/FunctionHelpers.h @@ -25,6 +25,13 @@ const Type * checkAndGetDataType(const IDataType * data_type) return typeid_cast(data_type); } +/// Throws on mismatch. 
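+/// (Specifically LOGICAL_ERROR, the same contract as the checkAndGetColumn
+/// reference overload documented in IColumn.h.)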
+template +const Type & checkAndGetDataType(const IDataType & data_type) +{ + return typeid_cast(data_type); +} + template bool checkDataTypes(const IDataType * data_type) { @@ -34,10 +41,12 @@ bool checkDataTypes(const IDataType * data_type) template const ColumnConst * checkAndGetColumnConst(const IColumn * column) { - if (!column || !isColumnConst(*column)) + if (!column) return {}; - const ColumnConst * res = assert_cast(column); + const ColumnConst * res = checkAndGetColumn(column); + if (!res) + return {}; if (!checkColumn(&res->getDataColumn())) return {}; @@ -45,6 +54,18 @@ const ColumnConst * checkAndGetColumnConst(const IColumn * column) return res; } +template +const ColumnConst & checkAndGetColumnConst(const IColumn & column) +{ + const ColumnConst & res = checkAndGetColumn(column); + + const auto & data_column = res.getDataColumn(); + if (!checkColumn(&data_column)) + throw DB::Exception(DB::ErrorCodes::LOGICAL_ERROR, "Unexpected const column type: expected {}, got {}", demangle(typeid(Type).name()), demangle(typeid(data_column).name())); + + return res; +} + template const Type * checkAndGetColumnConstData(const IColumn * column) { diff --git a/src/Functions/FunctionUnixTimestamp64.h b/src/Functions/FunctionUnixTimestamp64.h index 53421a565cb..c418163343b 100644 --- a/src/Functions/FunctionUnixTimestamp64.h +++ b/src/Functions/FunctionUnixTimestamp64.h @@ -140,7 +140,7 @@ public: const auto & src = arguments[0]; const auto & col = *src.column; - if (!checkAndGetColumn>(col)) + if (!checkAndGetColumn>(&col)) return false; auto & result_data = result_column->getData(); diff --git a/src/Functions/FunctionsBitmap.h b/src/Functions/FunctionsBitmap.h index 22d46fa7728..92ec71a3118 100644 --- a/src/Functions/FunctionsBitmap.h +++ b/src/Functions/FunctionsBitmap.h @@ -193,8 +193,8 @@ private: const ColumnArray * array = typeid_cast(arguments[0].column.get()); const ColumnPtr & mapped = array->getDataPtr(); const ColumnArray::Offsets & offsets = array->getOffsets(); - const ColumnVector * column = checkAndGetColumn>(&*mapped); - const typename ColumnVector::Container & input_data = column->getData(); + const ColumnVector & column = checkAndGetColumn>(*mapped); + const typename ColumnVector::Container & input_data = column.getData(); // output data Array params_row; diff --git a/src/Functions/FunctionsCodingIP.cpp b/src/Functions/FunctionsCodingIP.cpp index 7bdbac6531d..54f7b6dd1f4 100644 --- a/src/Functions/FunctionsCodingIP.cpp +++ b/src/Functions/FunctionsCodingIP.cpp @@ -536,7 +536,7 @@ public: const auto & col_type_name = arguments[0]; const ColumnPtr & column = col_type_name.column; - if (const auto * col_in = checkAndGetColumn(*column)) + if (const auto * col_in = checkAndGetColumn(&*column)) { auto col_res = ColumnIPv6::create(); @@ -551,7 +551,7 @@ public: return col_res; } - if (const auto * col_in = checkAndGetColumn(*column)) + if (const auto * col_in = checkAndGetColumn(&*column)) { auto col_res = ColumnFixedString::create(IPV6_BINARY_LENGTH); diff --git a/src/Functions/FunctionsConversion.cpp b/src/Functions/FunctionsConversion.cpp index a16ce136b9a..02da450e0c2 100644 --- a/src/Functions/FunctionsConversion.cpp +++ b/src/Functions/FunctionsConversion.cpp @@ -3302,7 +3302,7 @@ private: /// both columns have type UInt8, but we shouldn't use identity wrapper, /// because Bool column can contain only 0 and 1. 
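        /// (i.e. each source byte is normalized to 0 or 1 below rather than copied as-is)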
auto res_column = to_type->createColumn(); - const auto & data_from = checkAndGetColumn(arguments[0].column.get())->getData(); + const auto & data_from = checkAndGetColumn(*arguments[0].column).getData(); auto & data_to = assert_cast(res_column.get())->getData(); data_to.resize(data_from.size()); for (size_t i = 0; i != data_from.size(); ++i) diff --git a/src/Functions/FunctionsRound.h b/src/Functions/FunctionsRound.h index 3d1028c6d35..24ffb5eb0c1 100644 --- a/src/Functions/FunctionsRound.h +++ b/src/Functions/FunctionsRound.h @@ -467,28 +467,28 @@ struct Dispatcher static ColumnPtr apply(const IColumn * col_general, Scale scale_arg) { - const auto * const col = checkAndGetColumn>(col_general); + const auto & col = checkAndGetColumn>(*col_general); auto col_res = ColumnVector::create(); typename ColumnVector::Container & vec_res = col_res->getData(); - vec_res.resize(col->getData().size()); + vec_res.resize(col.getData().size()); if (!vec_res.empty()) { if (scale_arg == 0) { size_t scale = 1; - FunctionRoundingImpl::apply(col->getData(), scale, vec_res); + FunctionRoundingImpl::apply(col.getData(), scale, vec_res); } else if (scale_arg > 0) { size_t scale = intExp10(scale_arg); - FunctionRoundingImpl::apply(col->getData(), scale, vec_res); + FunctionRoundingImpl::apply(col.getData(), scale, vec_res); } else { size_t scale = intExp10(-scale_arg); - FunctionRoundingImpl::apply(col->getData(), scale, vec_res); + FunctionRoundingImpl::apply(col.getData(), scale, vec_res); } } @@ -502,14 +502,14 @@ struct Dispatcher public: static ColumnPtr apply(const IColumn * col_general, Scale scale_arg) { - const auto * const col = checkAndGetColumn>(col_general); - const typename ColumnDecimal::Container & vec_src = col->getData(); + const auto & col = checkAndGetColumn>(*col_general); + const typename ColumnDecimal::Container & vec_src = col.getData(); - auto col_res = ColumnDecimal::create(vec_src.size(), col->getScale()); + auto col_res = ColumnDecimal::create(vec_src.size(), col.getScale()); auto & vec_res = col_res->getData(); if (!vec_res.empty()) - DecimalRoundingImpl::apply(col->getData(), col->getScale(), vec_res, scale_arg); + DecimalRoundingImpl::apply(col.getData(), col.getScale(), vec_res, scale_arg); return col_res; } diff --git a/src/Functions/FunctionsStringHash.h b/src/Functions/FunctionsStringHash.h index d951e77395e..fcd4c970a47 100644 --- a/src/Functions/FunctionsStringHash.h +++ b/src/Functions/FunctionsStringHash.h @@ -153,8 +153,8 @@ public: auto col_res = ColumnVector::create(); auto & vec_res = col_res->getData(); vec_res.resize(column->size()); - const ColumnString * col_str_vector = checkAndGetColumn(&*column); - Impl::apply(col_str_vector->getChars(), col_str_vector->getOffsets(), shingle_size, vec_res); + const ColumnString & col_str_vector = checkAndGetColumn(*column); + Impl::apply(col_str_vector.getChars(), col_str_vector.getOffsets(), shingle_size, vec_res); return col_res; } else if constexpr (is_arg) // Min hash arg @@ -170,8 +170,8 @@ public: auto min_tuple = ColumnTuple::create(std::move(min_columns)); auto max_tuple = ColumnTuple::create(std::move(max_columns)); - const ColumnString * col_str_vector = checkAndGetColumn(&*column); - Impl::apply(col_str_vector->getChars(), col_str_vector->getOffsets(), shingle_size, num_hashes, nullptr, nullptr, min_tuple.get(), max_tuple.get()); + const ColumnString & col_str_vector = checkAndGetColumn(*column); + Impl::apply(col_str_vector.getChars(), col_str_vector.getOffsets(), shingle_size, num_hashes, nullptr, nullptr, 
min_tuple.get(), max_tuple.get()); MutableColumns tuple_columns; tuple_columns.emplace_back(std::move(min_tuple)); @@ -186,8 +186,8 @@ public: auto & vec_h2 = col_h2->getData(); vec_h1.resize(column->size()); vec_h2.resize(column->size()); - const ColumnString * col_str_vector = checkAndGetColumn(&*column); - Impl::apply(col_str_vector->getChars(), col_str_vector->getOffsets(), shingle_size, num_hashes, &vec_h1, &vec_h2, nullptr, nullptr); + const ColumnString & col_str_vector = checkAndGetColumn(*column); + Impl::apply(col_str_vector.getChars(), col_str_vector.getOffsets(), shingle_size, num_hashes, &vec_h1, &vec_h2, nullptr, nullptr); MutableColumns tuple_columns; tuple_columns.emplace_back(std::move(col_h1)); tuple_columns.emplace_back(std::move(col_h2)); diff --git a/src/Functions/Kusto/KqlArraySort.cpp b/src/Functions/Kusto/KqlArraySort.cpp index 5be36328cc3..22544f4302c 100644 --- a/src/Functions/Kusto/KqlArraySort.cpp +++ b/src/Functions/Kusto/KqlArraySort.cpp @@ -158,12 +158,12 @@ public: auto out_tmp = ColumnArray::create(nested_types[i]->createColumn()); size_t array_size = tuple_coulmn->size(); - const auto * arr = checkAndGetColumn(tuple_coulmn.get()); + const auto & arr = checkAndGetColumn(*tuple_coulmn); for (size_t j = 0; j < array_size; ++j) { Field arr_field; - arr->get(j, arr_field); + arr.get(j, arr_field); out_tmp->insert(arr_field); } diff --git a/src/Functions/MultiMatchAllIndicesImpl.h b/src/Functions/MultiMatchAllIndicesImpl.h index d655311f532..3e9c8fba215 100644 --- a/src/Functions/MultiMatchAllIndicesImpl.h +++ b/src/Functions/MultiMatchAllIndicesImpl.h @@ -185,7 +185,7 @@ struct MultiMatchAllIndicesImpl size_t prev_haystack_offset = 0; size_t prev_needles_offset = 0; - const ColumnString * needles_data_string = checkAndGetColumn(&needles_data); + const ColumnString & needles_data_string = checkAndGetColumn(needles_data); std::vector needles; @@ -195,7 +195,7 @@ struct MultiMatchAllIndicesImpl for (size_t j = prev_needles_offset; j < needles_offsets[i]; ++j) { - needles.emplace_back(needles_data_string->getDataAt(j).toView()); + needles.emplace_back(needles_data_string.getDataAt(j).toView()); } if (needles.empty()) diff --git a/src/Functions/MultiMatchAnyImpl.h b/src/Functions/MultiMatchAnyImpl.h index 0b9eee2382f..000c334f6c1 100644 --- a/src/Functions/MultiMatchAnyImpl.h +++ b/src/Functions/MultiMatchAnyImpl.h @@ -212,7 +212,7 @@ struct MultiMatchAnyImpl size_t prev_haystack_offset = 0; size_t prev_needles_offset = 0; - const ColumnString * needles_data_string = checkAndGetColumn(&needles_data); + const ColumnString & needles_data_string = checkAndGetColumn(needles_data); std::vector needles; @@ -221,7 +221,7 @@ struct MultiMatchAnyImpl needles.reserve(needles_offsets[i] - prev_needles_offset); for (size_t j = prev_needles_offset; j < needles_offsets[i]; ++j) - needles.emplace_back(needles_data_string->getDataAt(j).toView()); + needles.emplace_back(needles_data_string.getDataAt(j).toView()); if (needles.empty()) { diff --git a/src/Functions/MultiSearchAllPositionsImpl.h b/src/Functions/MultiSearchAllPositionsImpl.h index 6e1f13d87b6..cfe60e51bcd 100644 --- a/src/Functions/MultiSearchAllPositionsImpl.h +++ b/src/Functions/MultiSearchAllPositionsImpl.h @@ -89,7 +89,7 @@ struct MultiSearchAllPositionsImpl offsets_res.reserve(haystack_offsets.size()); - const ColumnString * needles_data_string = checkAndGetColumn(&needles_data); + const ColumnString & needles_data_string = checkAndGetColumn(needles_data); std::vector needles; @@ -99,7 +99,7 @@ struct 
MultiSearchAllPositionsImpl for (size_t j = prev_needles_offset; j < needles_offsets[i]; ++j) { - needles.emplace_back(needles_data_string->getDataAt(j).toView()); + needles.emplace_back(needles_data_string.getDataAt(j).toView()); } const size_t needles_size = needles.size(); diff --git a/src/Functions/MultiSearchFirstIndexImpl.h b/src/Functions/MultiSearchFirstIndexImpl.h index 73f3c92adfb..36a5fd514d9 100644 --- a/src/Functions/MultiSearchFirstIndexImpl.h +++ b/src/Functions/MultiSearchFirstIndexImpl.h @@ -88,7 +88,7 @@ struct MultiSearchFirstIndexImpl size_t prev_haystack_offset = 0; size_t prev_needles_offset = 0; - const ColumnString * needles_data_string = checkAndGetColumn(&needles_data); + const ColumnString & needles_data_string = checkAndGetColumn(needles_data); std::vector needles; @@ -98,7 +98,7 @@ struct MultiSearchFirstIndexImpl for (size_t j = prev_needles_offset; j < needles_offsets[i]; ++j) { - needles.emplace_back(needles_data_string->getDataAt(j).toView()); + needles.emplace_back(needles_data_string.getDataAt(j).toView()); } auto searcher = Impl::createMultiSearcherInBigHaystack(needles); // sub-optimal diff --git a/src/Functions/MultiSearchFirstPositionImpl.h b/src/Functions/MultiSearchFirstPositionImpl.h index 99dd3f9d394..8b137bb67d1 100644 --- a/src/Functions/MultiSearchFirstPositionImpl.h +++ b/src/Functions/MultiSearchFirstPositionImpl.h @@ -97,7 +97,7 @@ struct MultiSearchFirstPositionImpl size_t prev_haystack_offset = 0; size_t prev_needles_offset = 0; - const ColumnString * needles_data_string = checkAndGetColumn(&needles_data); + const ColumnString & needles_data_string = checkAndGetColumn(needles_data); std::vector needles; @@ -112,7 +112,7 @@ struct MultiSearchFirstPositionImpl for (size_t j = prev_needles_offset; j < needles_offsets[i]; ++j) { - needles.emplace_back(needles_data_string->getDataAt(j).toView()); + needles.emplace_back(needles_data_string.getDataAt(j).toView()); } auto searcher = Impl::createMultiSearcherInBigHaystack(needles); // sub-optimal diff --git a/src/Functions/MultiSearchImpl.h b/src/Functions/MultiSearchImpl.h index fb7d56f302a..494eb323639 100644 --- a/src/Functions/MultiSearchImpl.h +++ b/src/Functions/MultiSearchImpl.h @@ -87,7 +87,7 @@ struct MultiSearchImpl size_t prev_haystack_offset = 0; size_t prev_needles_offset = 0; - const ColumnString * needles_data_string = checkAndGetColumn(&needles_data); + const ColumnString & needles_data_string = checkAndGetColumn(needles_data); std::vector needles; @@ -97,7 +97,7 @@ struct MultiSearchImpl for (size_t j = prev_needles_offset; j < needles_offsets[i]; ++j) { - needles.emplace_back(needles_data_string->getDataAt(j).toView()); + needles.emplace_back(needles_data_string.getDataAt(j).toView()); } const auto * const haystack = &haystack_data[prev_haystack_offset]; diff --git a/src/Functions/URL/FirstSignificantSubdomainCustomImpl.h b/src/Functions/URL/FirstSignificantSubdomainCustomImpl.h index 93691e35741..68582198ea3 100644 --- a/src/Functions/URL/FirstSignificantSubdomainCustomImpl.h +++ b/src/Functions/URL/FirstSignificantSubdomainCustomImpl.h @@ -69,7 +69,7 @@ public: const ColumnConst * column_tld_list_name = checkAndGetColumnConstStringOrFixedString(arguments[1].column.get()); FirstSignificantSubdomainCustomLookup tld_lookup(column_tld_list_name->getValue()); - if (const ColumnString * col = checkAndGetColumn(*arguments[0].column)) + if (const ColumnString * col = checkAndGetColumn(&*arguments[0].column)) { auto col_res = ColumnString::create(); vector(tld_lookup, col->getChars(), 
col->getOffsets(), col_res->getChars(), col_res->getOffsets()); diff --git a/src/Functions/array/FunctionArrayMapped.h b/src/Functions/array/FunctionArrayMapped.h index 5d6d70521b0..3c8dc04de46 100644 --- a/src/Functions/array/FunctionArrayMapped.h +++ b/src/Functions/array/FunctionArrayMapped.h @@ -317,7 +317,7 @@ public: ErrorCodes::ILLEGAL_COLUMN, "Expected Array column, found {}", column_array_ptr->getName()); column_array_ptr = recursiveRemoveLowCardinality(column_const_array->convertToFullColumn()); - column_array = checkAndGetColumn(column_array_ptr.get()); + column_array = &checkAndGetColumn(*column_array_ptr); } if (!array_type) diff --git a/src/Functions/array/arrayCompact.cpp b/src/Functions/array/arrayCompact.cpp index 7d09d1078d5..fe870bebd84 100644 --- a/src/Functions/array/arrayCompact.cpp +++ b/src/Functions/array/arrayCompact.cpp @@ -34,7 +34,7 @@ struct ArrayCompactImpl using ColVecType = ColumnVectorOrDecimal; const ColVecType * check_values_column = checkAndGetColumn(mapped.get()); - const ColVecType * src_values_column = checkAndGetColumn(array.getData()); + const ColVecType * src_values_column = checkAndGetColumn(&array.getData()); if (!src_values_column || !check_values_column) return false; diff --git a/src/Functions/array/arrayDistinct.cpp b/src/Functions/array/arrayDistinct.cpp index ea331d6bdad..2344742e4fd 100644 --- a/src/Functions/array/arrayDistinct.cpp +++ b/src/Functions/array/arrayDistinct.cpp @@ -89,20 +89,20 @@ private: ColumnPtr FunctionArrayDistinct::executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t /*input_rows_count*/) const { ColumnPtr array_ptr = arguments[0].column; - const ColumnArray * array = checkAndGetColumn(array_ptr.get()); + const ColumnArray & array = checkAndGetColumn(*array_ptr); const auto & return_type = result_type; auto res_ptr = return_type->createColumn(); ColumnArray & res = assert_cast(*res_ptr); - const IColumn & src_data = array->getData(); - const ColumnArray::Offsets & offsets = array->getOffsets(); + const IColumn & src_data = array.getData(); + const ColumnArray::Offsets & offsets = array.getOffsets(); IColumn & res_data = res.getData(); ColumnArray::Offsets & res_offsets = res.getOffsets(); - const ColumnNullable * nullable_col = checkAndGetColumn(src_data); + const ColumnNullable * nullable_col = checkAndGetColumn(&src_data); const IColumn * inner_col; diff --git a/src/Functions/array/arrayElement.cpp b/src/Functions/array/arrayElement.cpp index 8669fd1f3a7..227b29d5d9f 100644 --- a/src/Functions/array/arrayElement.cpp +++ b/src/Functions/array/arrayElement.cpp @@ -1538,9 +1538,9 @@ ColumnPtr FunctionArrayElement::executeMap2(const ColumnsWithTypeAndName & argum return nullptr; const ColumnArray * col_map_nested = &col_map->getNestedColumn(); - const ColumnTuple * col_map_kv = checkAndGetColumn(col_map_nested->getDataPtr().get()); - ColumnPtr col_map_keys = col_map_kv->getColumnPtr(0); - ColumnPtr col_map_values = col_map_kv->getColumnPtr(1); + const ColumnTuple & col_map_kv = checkAndGetColumn(*col_map_nested->getDataPtr()); + ColumnPtr col_map_keys = col_map_kv.getColumnPtr(0); + ColumnPtr col_map_values = col_map_kv.getColumnPtr(1); const DataTypeMap & map_type = typeid_cast(*typeid_cast(*arguments[0].type).getNestedType()); diff --git a/src/Functions/array/arrayEnumerateExtended.h b/src/Functions/array/arrayEnumerateExtended.h index cf38afcfa5a..62850a1cbf0 100644 --- a/src/Functions/array/arrayEnumerateExtended.h +++ b/src/Functions/array/arrayEnumerateExtended.h @@ -165,7 
+165,7 @@ ColumnPtr FunctionArrayEnumerateExtended::executeImpl(const ColumnsWith for (size_t i = 0; i < num_arguments; ++i) { - if (const auto * nullable_col = checkAndGetColumn(*data_columns[i])) + if (const auto * nullable_col = checkAndGetColumn(data_columns[i])) { if (num_arguments == 1) data_columns[i] = &nullable_col->getNestedColumn(); diff --git a/src/Functions/array/arrayIndex.h b/src/Functions/array/arrayIndex.h index cd537763b4a..c0b1c773387 100644 --- a/src/Functions/array/arrayIndex.h +++ b/src/Functions/array/arrayIndex.h @@ -506,10 +506,10 @@ private: const ColumnNullable * nullable = nullptr; if (col_array) - nullable = checkAndGetColumn(col_array->getData()); + nullable = checkAndGetColumn(&col_array->getData()); const auto & arg_column = arguments[1].column; - const ColumnNullable * arg_nullable = checkAndGetColumn(*arg_column); + const ColumnNullable * arg_nullable = checkAndGetColumn(&*arg_column); if (!nullable && !arg_nullable) { @@ -738,7 +738,7 @@ private: const auto [null_map_data, null_map_item] = getNullMaps(arguments); - if (const ColumnConst * col_arg_const = checkAndGetColumn(*arguments[1].column)) + if (const ColumnConst * col_arg_const = checkAndGetColumn(&*arguments[1].column)) { const IColumnUnique & col_lc_dict = col_lc->getDictionary(); @@ -754,7 +754,7 @@ private: if (!col_arg_cloned->isNullAt(0)) { if (col_arg_cloned->isNullable()) - col_arg_cloned = checkAndGetColumn(*col_arg_cloned)->getNestedColumnPtr(); + col_arg_cloned = checkAndGetColumn(*col_arg_cloned).getNestedColumnPtr(); StringRef elem = col_arg_cloned->getDataAt(0); @@ -786,7 +786,7 @@ private: else if (col_lc->nestedIsNullable()) // LowCardinality(Nullable(T)) and U { const ColumnPtr left_casted = col_lc->convertToFullColumnIfLowCardinality(); // Nullable(T) - const ColumnNullable& left_nullable = *checkAndGetColumn(left_casted.get()); + const ColumnNullable & left_nullable = checkAndGetColumn(*left_casted); const NullMap * const null_map_left_casted = &left_nullable.getNullMapColumn().getData(); diff --git a/src/Functions/array/arrayJaccardIndex.cpp b/src/Functions/array/arrayJaccardIndex.cpp index 9cb74a7aa62..87f3390ac73 100644 --- a/src/Functions/array/arrayJaccardIndex.cpp +++ b/src/Functions/array/arrayJaccardIndex.cpp @@ -97,8 +97,8 @@ public: { if (const ColumnConst * col_const = typeid_cast(col.column.get())) { - const ColumnArray * col_const_array = checkAndGetColumn(col_const->getDataColumnPtr().get()); - return {col_const_array, true}; + const ColumnArray & col_const_array = checkAndGetColumn(*col_const->getDataColumnPtr()); + return {&col_const_array, true}; } else if (const ColumnArray * col_non_const_array = checkAndGetColumn(col.column.get())) return {col_non_const_array, false}; @@ -128,8 +128,8 @@ public: vectorWithEmptyIntersect(left_array->getOffsets(), right_array->getOffsets(), vec_res); \ else \ { \ - const ColumnArray * intersect_column_array = checkAndGetColumn(intersect_column.column.get()); \ - vector(intersect_column_array->getOffsets(), left_array->getOffsets(), right_array->getOffsets(), vec_res); \ + const ColumnArray & intersect_column_array = checkAndGetColumn(*intersect_column.column); \ + vector(intersect_column_array.getOffsets(), left_array->getOffsets(), right_array->getOffsets(), vec_res); \ } if (!left_is_const && !right_is_const) diff --git a/src/Functions/array/arrayUniq.cpp b/src/Functions/array/arrayUniq.cpp index 81ba5b62094..f92daf384d2 100644 --- a/src/Functions/array/arrayUniq.cpp +++ b/src/Functions/array/arrayUniq.cpp @@ -162,7 +162,7 @@ 
ColumnPtr FunctionArrayUniq::executeImpl(const ColumnsWithTypeAndName & argument for (size_t i = 0; i < num_arguments; ++i) { - if (const auto * nullable_col = checkAndGetColumn(*data_columns[i])) + if (const auto * nullable_col = checkAndGetColumn(data_columns[i])) { if (num_arguments == 1) data_columns[i] = &nullable_col->getNestedColumn(); diff --git a/src/Functions/array/emptyArrayToSingle.cpp b/src/Functions/array/emptyArrayToSingle.cpp index 86d4c32265a..2071abf9911 100644 --- a/src/Functions/array/emptyArrayToSingle.cpp +++ b/src/Functions/array/emptyArrayToSingle.cpp @@ -391,7 +391,7 @@ ColumnPtr FunctionEmptyArrayToSingle::executeImpl(const ColumnsWithTypeAndName & const IColumn * inner_col; IColumn * inner_res_col; - const auto * nullable_col = checkAndGetColumn(src_data); + const auto * nullable_col = checkAndGetColumn(&src_data); if (nullable_col) { inner_col = &nullable_col->getNestedColumn(); diff --git a/src/Functions/array/range.cpp b/src/Functions/array/range.cpp index 57679ccb180..f939ea7b462 100644 --- a/src/Functions/array/range.cpp +++ b/src/Functions/array/range.cpp @@ -404,7 +404,7 @@ private: { if (!col.type->isNullable()) return; - const ColumnNullable * nullable_col = checkAndGetColumn(*col.column); + const ColumnNullable * nullable_col = checkAndGetColumn(col.column.get()); if (!nullable_col) nullable_col = checkAndGetColumnConstData(col.column.get()); if (!nullable_col) @@ -421,8 +421,8 @@ private: const auto * col = arguments[0].column.get(); if (arguments[0].type->isNullable()) { - const auto * nullable = checkAndGetColumn(*arguments[0].column); - col = nullable->getNestedColumnPtr().get(); + const auto & nullable = checkAndGetColumn(*arguments[0].column); + col = nullable.getNestedColumnPtr().get(); } if (!((res = executeInternal(col)) || (res = executeInternal(col)) || (res = executeInternal(col)) diff --git a/src/Functions/arrayStringConcat.cpp b/src/Functions/arrayStringConcat.cpp index c186c0ca7e6..b787feeeca1 100644 --- a/src/Functions/arrayStringConcat.cpp +++ b/src/Functions/arrayStringConcat.cpp @@ -183,7 +183,7 @@ public: const ColumnString & col_string = assert_cast(*str_subcolumn.get()); auto col_res = ColumnString::create(); - if (const ColumnNullable * col_nullable = checkAndGetColumn(col_arr.getData())) + if (const ColumnNullable * col_nullable = checkAndGetColumn(&col_arr.getData())) executeInternal(col_string, col_arr, delimiter, *col_res, col_nullable->getNullMapData().data()); else executeInternal(col_string, col_arr, delimiter, *col_res); diff --git a/src/Functions/assumeNotNull.cpp b/src/Functions/assumeNotNull.cpp index 4dd88163ecb..be9d38f5af3 100644 --- a/src/Functions/assumeNotNull.cpp +++ b/src/Functions/assumeNotNull.cpp @@ -54,7 +54,7 @@ public: if (arguments[0].type->onlyNull() && !col->empty()) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot create non-empty column with type Nothing"); - if (const auto * nullable_col = checkAndGetColumn(*col)) + if (const auto * nullable_col = checkAndGetColumn(&*col)) return nullable_col->getNestedColumnPtr(); else return col; diff --git a/src/Functions/coalesce.cpp b/src/Functions/coalesce.cpp index 4ae90a9db13..722f32af523 100644 --- a/src/Functions/coalesce.cpp +++ b/src/Functions/coalesce.cpp @@ -157,12 +157,12 @@ public: /// if last argument is not nullable, result should be also not nullable if (!multi_if_args.back().column->isNullable() && res->isNullable()) { - if (const auto * column_lc = checkAndGetColumn(*res)) - res = 
checkAndGetColumn(*column_lc->convertToFullColumn())->getNestedColumnPtr(); - else if (const auto * column_const = checkAndGetColumn(*res)) - res = checkAndGetColumn(column_const->getDataColumn())->getNestedColumnPtr(); + if (const auto * column_lc = checkAndGetColumn(&*res)) + res = checkAndGetColumn(*column_lc->convertToFullColumn()).getNestedColumnPtr(); + else if (const auto * column_const = checkAndGetColumn(&*res)) + res = checkAndGetColumn(column_const->getDataColumn()).getNestedColumnPtr(); else - res = checkAndGetColumn(*res)->getNestedColumnPtr(); + res = checkAndGetColumn(&*res)->getNestedColumnPtr(); } return res; diff --git a/src/Functions/fromModifiedJulianDay.cpp b/src/Functions/fromModifiedJulianDay.cpp index 695d1b7d63c..a1a3102c70e 100644 --- a/src/Functions/fromModifiedJulianDay.cpp +++ b/src/Functions/fromModifiedJulianDay.cpp @@ -34,8 +34,8 @@ namespace DB ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { using ColVecType = typename FromDataType::ColumnType; - const ColVecType * col_from = checkAndGetColumn(arguments[0].column.get()); - const typename ColVecType::Container & vec_from = col_from->getData(); + const ColVecType & col_from = checkAndGetColumn(*arguments[0].column); + const typename ColVecType::Container & vec_from = col_from.getData(); auto col_to = ColumnString::create(); ColumnString::Chars & data_to = col_to->getChars(); diff --git a/src/Functions/grouping.h b/src/Functions/grouping.h index 830c509f1f5..85ba1967909 100644 --- a/src/Functions/grouping.h +++ b/src/Functions/grouping.h @@ -55,7 +55,7 @@ public: template ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, size_t input_rows_count, AggregationKeyChecker checker) const { - const auto * grouping_set_column = checkAndGetColumn(arguments[0].column.get()); + const auto & grouping_set_column = checkAndGetColumn(*arguments[0].column); auto result = ColumnUInt64::create(); auto & result_data = result->getData(); @@ -64,7 +64,7 @@ public: const auto * result_table = likely(force_compatibility) ? 
COMPATIBLE_MODE : INCOMPATIBLE_MODE; for (size_t i = 0; i < input_rows_count; ++i) { - UInt64 set_index = grouping_set_column->getElement(i); + UInt64 set_index = grouping_set_column.getElement(i); UInt64 value = 0; for (auto index : arguments_indexes) diff --git a/src/Functions/hasColumnInTable.cpp b/src/Functions/hasColumnInTable.cpp index 48783a672e2..8ea16f688ee 100644 --- a/src/Functions/hasColumnInTable.cpp +++ b/src/Functions/hasColumnInTable.cpp @@ -88,8 +88,8 @@ ColumnPtr FunctionHasColumnInTable::executeImpl(const ColumnsWithTypeAndName & a { auto get_string_from_columns = [&](const ColumnWithTypeAndName & column) -> String { - const ColumnConst * const_column = checkAndGetColumnConst(column.column.get()); - return const_column->getValue(); + const ColumnConst & const_column = checkAndGetColumnConst(*column.column); + return const_column.getValue(); }; size_t arg = 0; diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index 4f75042ad8d..9766f34edca 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -948,12 +948,12 @@ private: bool cond_is_const = false; bool cond_is_true = false; bool cond_is_false = false; - if (const auto * const_arg = checkAndGetColumn(*arg_cond.column)) + if (const auto * const_arg = checkAndGetColumn(&*arg_cond.column)) { cond_is_const = true; not_const_condition = const_arg->getDataColumnPtr(); ColumnPtr data_column = const_arg->getDataColumnPtr(); - if (const auto * const_nullable_arg = checkAndGetColumn(*data_column)) + if (const auto * const_nullable_arg = checkAndGetColumn(&*data_column)) { data_column = const_nullable_arg->getNestedColumnPtr(); if (!data_column->empty()) @@ -962,7 +962,7 @@ private: if (!data_column->empty()) { - cond_is_true = !cond_is_null && checkAndGetColumn(*data_column)->getBool(0); + cond_is_true = !cond_is_null && checkAndGetColumn(*data_column).getBool(0); cond_is_false = !cond_is_null && !cond_is_true; } } @@ -975,12 +975,12 @@ private: else if (cond_is_false || cond_is_null) return castColumn(column2, result_type); - if (const auto * nullable = checkAndGetColumn(*not_const_condition)) + if (const auto * nullable = checkAndGetColumn(&*not_const_condition)) { ColumnPtr new_cond_column = nullable->getNestedColumnPtr(); size_t column_size = arg_cond.column->size(); - if (checkAndGetColumn(*new_cond_column)) + if (checkAndGetColumn(&*new_cond_column)) { auto nested_column_copy = new_cond_column->cloneResized(new_cond_column->size()); typeid_cast(nested_column_copy.get())->applyZeroMap(nullable->getNullMapData()); @@ -1027,12 +1027,12 @@ private: /// Const(size = 0, Int32(size = 1)) static ColumnPtr recursiveGetNestedColumnWithoutNullable(const ColumnPtr & column) { - if (const auto * nullable = checkAndGetColumn(*column)) + if (const auto * nullable = checkAndGetColumn(&*column)) { /// Nullable cannot contain Nullable return nullable->getNestedColumnPtr(); } - else if (const auto * column_const = checkAndGetColumn(*column)) + else if (const auto * column_const = checkAndGetColumn(&*column)) { /// Save Constant, but remove Nullable return ColumnConst::create(recursiveGetNestedColumnWithoutNullable(column_const->getDataColumnPtr()), column->size()); @@ -1051,8 +1051,8 @@ private: const ColumnWithTypeAndName & arg_then = arguments[1]; const ColumnWithTypeAndName & arg_else = arguments[2]; - const auto * then_is_nullable = checkAndGetColumn(*arg_then.column); - const auto * else_is_nullable = checkAndGetColumn(*arg_else.column); + const auto * then_is_nullable = checkAndGetColumn(&*arg_then.column); + const auto * 
else_is_nullable = checkAndGetColumn(&*arg_else.column); if (!then_is_nullable && !else_is_nullable) return nullptr; diff --git a/src/Functions/isNotNull.cpp b/src/Functions/isNotNull.cpp index dd5182aeade..dd53c700221 100644 --- a/src/Functions/isNotNull.cpp +++ b/src/Functions/isNotNull.cpp @@ -46,7 +46,7 @@ public: if (isVariant(elem.type)) { - const auto & discriminators = checkAndGetColumn(*elem.column)->getLocalDiscriminators(); + const auto & discriminators = checkAndGetColumn(*elem.column).getLocalDiscriminators(); auto res = DataTypeUInt8().createColumn(); auto & data = typeid_cast(*res).getData(); data.resize(discriminators.size()); @@ -57,17 +57,17 @@ public: if (elem.type->isLowCardinalityNullable()) { - const auto * low_cardinality_column = checkAndGetColumn(*elem.column); - const size_t null_index = low_cardinality_column->getDictionary().getNullValueIndex(); + const auto & low_cardinality_column = checkAndGetColumn(*elem.column); + const size_t null_index = low_cardinality_column.getDictionary().getNullValueIndex(); auto res = DataTypeUInt8().createColumn(); auto & data = typeid_cast(*res).getData(); - data.resize(low_cardinality_column->size()); - for (size_t i = 0; i != low_cardinality_column->size(); ++i) - data[i] = (low_cardinality_column->getIndexAt(i) != null_index); + data.resize(low_cardinality_column.size()); + for (size_t i = 0; i != low_cardinality_column.size(); ++i) + data[i] = (low_cardinality_column.getIndexAt(i) != null_index); return res; } - if (const auto * nullable = checkAndGetColumn(*elem.column)) + if (const auto * nullable = checkAndGetColumn(&*elem.column)) { /// Return the negated null map. auto res_column = ColumnUInt8::create(input_rows_count); diff --git a/src/Functions/isNull.cpp b/src/Functions/isNull.cpp index 4bf4e44f866..7a6dabab7af 100644 --- a/src/Functions/isNull.cpp +++ b/src/Functions/isNull.cpp @@ -48,7 +48,7 @@ public: if (isVariant(elem.type)) { - const auto & discriminators = checkAndGetColumn(*elem.column)->getLocalDiscriminators(); + const auto & discriminators = checkAndGetColumn(*elem.column).getLocalDiscriminators(); auto res = DataTypeUInt8().createColumn(); auto & data = typeid_cast(*res).getData(); data.reserve(discriminators.size()); @@ -59,17 +59,17 @@ public: if (elem.type->isLowCardinalityNullable()) { - const auto * low_cardinality_column = checkAndGetColumn(*elem.column); - size_t null_index = low_cardinality_column->getDictionary().getNullValueIndex(); + const auto & low_cardinality_column = checkAndGetColumn(*elem.column); + size_t null_index = low_cardinality_column.getDictionary().getNullValueIndex(); auto res = DataTypeUInt8().createColumn(); auto & data = typeid_cast(*res).getData(); - data.reserve(low_cardinality_column->size()); - for (size_t i = 0; i != low_cardinality_column->size(); ++i) - data.push_back(low_cardinality_column->getIndexAt(i) == null_index); + data.reserve(low_cardinality_column.size()); + for (size_t i = 0; i != low_cardinality_column.size(); ++i) + data.push_back(low_cardinality_column.getIndexAt(i) == null_index); return res; } - if (const auto * nullable = checkAndGetColumn(*elem.column)) + if (const auto * nullable = checkAndGetColumn(&*elem.column)) { /// Merely return the embedded null map. 
return nullable->getNullMapColumnPtr(); diff --git a/src/Functions/minSampleSize.cpp b/src/Functions/minSampleSize.cpp index a5826ef5c0e..f37b030c85a 100644 --- a/src/Functions/minSampleSize.cpp +++ b/src/Functions/minSampleSize.cpp @@ -102,14 +102,14 @@ struct ContinuousImpl auto baseline_argument = arguments[0]; baseline_argument.column = baseline_argument.column->convertToFullColumnIfConst(); auto baseline_column_untyped = castColumnAccurate(baseline_argument, float_64_type); - const auto * baseline_column = checkAndGetColumn>(*baseline_column_untyped); - const auto & baseline_column_data = baseline_column->getData(); + const auto & baseline_column = checkAndGetColumn>(*baseline_column_untyped); + const auto & baseline_column_data = baseline_column.getData(); auto sigma_argument = arguments[1]; sigma_argument.column = sigma_argument.column->convertToFullColumnIfConst(); auto sigma_column_untyped = castColumnAccurate(sigma_argument, float_64_type); - const auto * sigma_column = checkAndGetColumn>(*sigma_column_untyped); - const auto & sigma_column_data = sigma_column->getData(); + const auto & sigma_column = checkAndGetColumn>(*sigma_column_untyped); + const auto & sigma_column_data = sigma_column.getData(); const IColumn & col_mde = *arguments[2].column; const IColumn & col_power = *arguments[3].column; diff --git a/src/Functions/multiIf.cpp b/src/Functions/multiIf.cpp index 49c45d0c0be..8ea2a91f2de 100644 --- a/src/Functions/multiIf.cpp +++ b/src/Functions/multiIf.cpp @@ -198,7 +198,7 @@ public: if (cond_col->onlyNull()) continue; - if (const auto * column_const = checkAndGetColumn(*cond_col)) + if (const auto * column_const = checkAndGetColumn(&*cond_col)) { Field value = column_const->getField(); diff --git a/src/Functions/readWkt.cpp b/src/Functions/readWkt.cpp index 8dff297bcb1..ddc847b1ca5 100644 --- a/src/Functions/readWkt.cpp +++ b/src/Functions/readWkt.cpp @@ -51,14 +51,14 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & /*result_type*/, size_t input_rows_count) const override { - const auto * column_string = checkAndGetColumn(arguments[0].column.get()); + const auto & column_string = checkAndGetColumn(*arguments[0].column); Serializer serializer; Geometry geometry; for (size_t i = 0; i < input_rows_count; ++i) { - const auto & str = column_string->getDataAt(i).toString(); + const auto & str = column_string.getDataAt(i).toString(); boost::geometry::read_wkt(str, geometry); serializer.add(geometry); } diff --git a/src/Functions/repeat.cpp b/src/Functions/repeat.cpp index 6f2078b7e48..84597f4eadc 100644 --- a/src/Functions/repeat.cpp +++ b/src/Functions/repeat.cpp @@ -238,9 +238,9 @@ public: { using DataType = std::decay_t; using T = typename DataType::FieldType; - const ColumnVector * column = checkAndGetColumn>(col_num.get()); + const ColumnVector & column = checkAndGetColumn>(*col_num); auto col_res = ColumnString::create(); - RepeatImpl::vectorStrVectorRepeat(col->getChars(), col->getOffsets(), col_res->getChars(), col_res->getOffsets(), column->getData()); + RepeatImpl::vectorStrVectorRepeat(col->getChars(), col->getOffsets(), col_res->getChars(), col_res->getOffsets(), column.getData()); res = std::move(col_res); return true; })) @@ -258,9 +258,9 @@ public: { using DataType = std::decay_t; using T = typename DataType::FieldType; - const ColumnVector * column = checkAndGetColumn>(col_num.get()); + const ColumnVector & column = checkAndGetColumn>(*col_num); auto col_res = ColumnString::create(); - 
RepeatImpl::constStrVectorRepeat(copy_str, col_res->getChars(), col_res->getOffsets(), column->getData()); + RepeatImpl::constStrVectorRepeat(copy_str, col_res->getChars(), col_res->getOffsets(), column.getData()); res = std::move(col_res); return true; })) diff --git a/src/Functions/seriesOutliersDetectTukey.cpp b/src/Functions/seriesOutliersDetectTukey.cpp index da04d3b78d3..81fc904e16e 100644 --- a/src/Functions/seriesOutliersDetectTukey.cpp +++ b/src/Functions/seriesOutliersDetectTukey.cpp @@ -61,10 +61,10 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { ColumnPtr col = arguments[0].column; - const ColumnArray * col_arr = checkAndGetColumn(col.get()); + const ColumnArray & col_arr = checkAndGetColumn(*col); - const IColumn & arr_data = col_arr->getData(); - const ColumnArray::Offsets & arr_offsets = col_arr->getOffsets(); + const IColumn & arr_data = col_arr.getData(); + const ColumnArray::Offsets & arr_offsets = col_arr.getOffsets(); ColumnPtr col_res; if (input_rows_count == 0) diff --git a/src/Functions/seriesPeriodDetectFFT.cpp b/src/Functions/seriesPeriodDetectFFT.cpp index fbaa2b14e64..e85b3a97c67 100644 --- a/src/Functions/seriesPeriodDetectFFT.cpp +++ b/src/Functions/seriesPeriodDetectFFT.cpp @@ -61,10 +61,10 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { ColumnPtr array_ptr = arguments[0].column; - const ColumnArray * array = checkAndGetColumn(array_ptr.get()); + const ColumnArray & array = checkAndGetColumn(*array_ptr); - const IColumn & src_data = array->getData(); - const ColumnArray::Offsets & offsets = array->getOffsets(); + const IColumn & src_data = array.getData(); + const ColumnArray::Offsets & offsets = array.getOffsets(); auto res = ColumnFloat64::create(input_rows_count); auto & res_data = res->getData(); diff --git a/src/Functions/space.cpp b/src/Functions/space.cpp index 03dc0d06719..4cfa629aa33 100644 --- a/src/Functions/space.cpp +++ b/src/Functions/space.cpp @@ -57,14 +57,14 @@ public: template bool executeConstant(ColumnPtr col_times, ColumnString::Offsets & res_offsets, ColumnString::Chars & res_chars) const { - const ColumnConst * col_times_const = checkAndGetColumn(col_times.get()); + const ColumnConst & col_times_const = checkAndGetColumn(*col_times); - const ColumnPtr & col_times_const_internal = col_times_const->getDataColumnPtr(); + const ColumnPtr & col_times_const_internal = col_times_const.getDataColumnPtr(); if (!checkAndGetColumn(col_times_const_internal.get())) return false; using T = typename DataType::FieldType; - T times = col_times_const->getValue(); + T times = col_times_const.getValue(); if (times < 1) times = 0; diff --git a/src/Functions/toStartOfInterval.cpp b/src/Functions/toStartOfInterval.cpp index 7f25a317466..54aa1205a35 100644 --- a/src/Functions/toStartOfInterval.cpp +++ b/src/Functions/toStartOfInterval.cpp @@ -164,7 +164,7 @@ private: if (isDateTime64(time_column_type)) { - const auto * time_column_vec = checkAndGetColumn(time_column_col); + const auto * time_column_vec = checkAndGetColumn(&time_column_col); auto scale = assert_cast(time_column_type).getScale(); if (time_column_vec) @@ -172,13 +172,13 @@ private: } else if (isDateTime(time_column_type)) { - const auto * time_column_vec = checkAndGetColumn(time_column_col); + const auto * time_column_vec = checkAndGetColumn(&time_column_col); if (time_column_vec) return 
dispatchForIntervalColumn(assert_cast(time_column_type), *time_column_vec, interval_column, result_type, time_zone); } else if (isDate(time_column_type)) { - const auto * time_column_vec = checkAndGetColumn(time_column_col); + const auto * time_column_vec = checkAndGetColumn(&time_column_col); if (time_column_vec) return dispatchForIntervalColumn(assert_cast(time_column_type), *time_column_vec, interval_column, result_type, time_zone); } diff --git a/src/Functions/ztest.cpp b/src/Functions/ztest.cpp index 55e1b59a897..c2579263674 100644 --- a/src/Functions/ztest.cpp +++ b/src/Functions/ztest.cpp @@ -98,23 +98,23 @@ public: static const auto uint64_data_type = std::make_shared>(); auto column_successes_x = castColumnAccurate(arguments[0], uint64_data_type); - const auto & data_successes_x = checkAndGetColumn>(column_successes_x.get())->getData(); + const auto & data_successes_x = checkAndGetColumn>(*column_successes_x).getData(); auto column_successes_y = castColumnAccurate(arguments[1], uint64_data_type); - const auto & data_successes_y = checkAndGetColumn>(column_successes_y.get())->getData(); + const auto & data_successes_y = checkAndGetColumn>(*column_successes_y).getData(); auto column_trials_x = castColumnAccurate(arguments[2], uint64_data_type); - const auto & data_trials_x = checkAndGetColumn>(column_trials_x.get())->getData(); + const auto & data_trials_x = checkAndGetColumn>(*column_trials_x).getData(); auto column_trials_y = castColumnAccurate(arguments[3], uint64_data_type); - const auto & data_trials_y = checkAndGetColumn>(column_trials_y.get())->getData(); + const auto & data_trials_y = checkAndGetColumn>(*column_trials_y).getData(); static const auto float64_data_type = std::make_shared>(); auto column_confidence_level = castColumnAccurate(arguments[4], float64_data_type); - const auto & data_confidence_level = checkAndGetColumn>(column_confidence_level.get())->getData(); + const auto & data_confidence_level = checkAndGetColumn>(*column_confidence_level).getData(); - String usevar = checkAndGetColumnConst(arguments[5].column.get())->getValue(); + String usevar = checkAndGetColumnConst(*arguments[5].column).getValue(); if (usevar != UNPOOLED && usevar != POOLED) throw Exception{ErrorCodes::BAD_ARGUMENTS, diff --git a/src/Interpreters/BloomFilterHash.h b/src/Interpreters/BloomFilterHash.h index 45098ecff99..8248e9e4469 100644 --- a/src/Interpreters/BloomFilterHash.h +++ b/src/Interpreters/BloomFilterHash.h @@ -108,7 +108,7 @@ struct BloomFilterHash { const auto * array_col = typeid_cast(column.get()); - if (checkAndGetColumn(array_col->getData())) + if (checkAndGetColumn(&array_col->getData())) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unexpected type {} of bloom filter index.", data_type->getName()); const auto & offsets = array_col->getOffsets(); diff --git a/src/Interpreters/HashJoin.cpp b/src/Interpreters/HashJoin.cpp index 9b05edbce36..0db998c14fc 100644 --- a/src/Interpreters/HashJoin.cpp +++ b/src/Interpreters/HashJoin.cpp @@ -216,7 +216,7 @@ static void correctNullabilityInplace(ColumnWithTypeAndName & column, bool nulla { /// We have to replace values masked by NULLs with defaults. 
if (column.column) - if (const auto * nullable_column = checkAndGetColumn(*column.column)) + if (const auto * nullable_column = checkAndGetColumn(&*column.column)) column.column = JoinCommon::filterWithBlanks(column.column, nullable_column->getNullMapColumn().getData(), true); JoinCommon::removeColumnNullability(column); diff --git a/src/Interpreters/InterpreterCheckQuery.cpp b/src/Interpreters/InterpreterCheckQuery.cpp index ae8cef3f102..4a84a7bf570 100644 --- a/src/Interpreters/InterpreterCheckQuery.cpp +++ b/src/Interpreters/InterpreterCheckQuery.cpp @@ -334,10 +334,10 @@ public: if ((columns.size() != 3 && columns.size() != 5) || column_position_to_check >= columns.size()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Wrong number of columns: {}, position {}", columns.size(), column_position_to_check); - const auto * col = checkAndGetColumn(columns[column_position_to_check].get()); - for (size_t i = 0; i < col->size(); ++i) + const auto & col = checkAndGetColumn(*columns[column_position_to_check]); + for (size_t i = 0; i < col.size(); ++i) { - if (col->getElement(i) == 0) + if (col.getElement(i) == 0) { result_value = 0; return; diff --git a/src/Interpreters/JoinUtils.cpp b/src/Interpreters/JoinUtils.cpp index 0aee96ee9c4..1788c9aca48 100644 --- a/src/Interpreters/JoinUtils.cpp +++ b/src/Interpreters/JoinUtils.cpp @@ -162,7 +162,7 @@ static ColumnPtr tryConvertColumnToNullable(ColumnPtr col) return col_lc.cloneNullable(); } } - else if (const ColumnConst * col_const = checkAndGetColumn(*col)) + else if (const ColumnConst * col_const = checkAndGetColumn(&*col)) { const auto & nested = col_const->getDataColumnPtr(); if (nested->isNullable() || nested->canBeInsideNullable()) @@ -232,7 +232,7 @@ void removeColumnNullability(ColumnWithTypeAndName & column) if (column.column && column.column->isNullable()) { column.column = column.column->convertToFullColumnIfConst(); - const auto * nullable_col = checkAndGetColumn(*column.column); + const auto * nullable_col = checkAndGetColumn(column.column.get()); if (!nullable_col) { throw DB::Exception(ErrorCodes::LOGICAL_ERROR, "Column '{}' is expected to be nullable", column.dumpStructure()); @@ -258,11 +258,11 @@ void changeColumnRepresentation(const ColumnPtr & src_column, ColumnPtr & dst_co if (nullable_src && !nullable_dst) { - const auto * nullable = checkAndGetColumn(*src_column); + const auto & nullable = checkAndGetColumn(*src_column); if (change_lowcard) - dst_column = changeLowCardinality(nullable->getNestedColumnPtr(), dst_column); + dst_column = changeLowCardinality(nullable.getNestedColumnPtr(), dst_column); else - dst_column = nullable->getNestedColumnPtr(); + dst_column = nullable.getNestedColumnPtr(); } else if (!nullable_src && nullable_dst) { @@ -275,7 +275,7 @@ void changeColumnRepresentation(const ColumnPtr & src_column, ColumnPtr & dst_co { if (change_lowcard) { - if (const auto * nullable = checkAndGetColumn(*src_column)) + if (const auto * nullable = checkAndGetColumn(&*src_column)) { dst_column = makeNullable(changeLowCardinality(nullable->getNestedColumnPtr(), dst_not_null)); assert_cast(*dst_column->assumeMutable()).applyNullMap(nullable->getNullMapColumn()); @@ -291,7 +291,7 @@ void changeColumnRepresentation(const ColumnPtr & src_column, ColumnPtr & dst_co ColumnPtr emptyNotNullableClone(const ColumnPtr & column) { if (column->isNullable()) - return checkAndGetColumn(*column)->getNestedColumnPtr()->cloneEmpty(); + return checkAndGetColumn(*column).getNestedColumnPtr()->cloneEmpty(); return column->cloneEmpty(); } @@ -374,10 
+374,10 @@ ColumnRawPtrs extractKeysForJoin(const Block & block_keys, const Names & key_nam key_columns[i] = block_keys.getByName(column_name).column.get(); /// We will join only keys, where all components are not NULL. - if (const auto * nullable = checkAndGetColumn(*key_columns[i])) + if (const auto * nullable = checkAndGetColumn(&*key_columns[i])) key_columns[i] = &nullable->getNestedColumn(); - if (const auto * sparse = checkAndGetColumn(*key_columns[i])) + if (const auto * sparse = checkAndGetColumn(&*key_columns[i])) key_columns[i] = &sparse->getValuesColumn(); } @@ -490,7 +490,7 @@ JoinMask getColumnAsMask(const Block & block, const String & column_name) if (isNothing(col_type)) return JoinMask(false, block.rows()); - if (const auto * const_cond = checkAndGetColumn(*src_col.column)) + if (const auto * const_cond = checkAndGetColumn(&*src_col.column)) { return JoinMask(const_cond->getBool(0), block.rows()); } diff --git a/src/Interpreters/MergeJoin.cpp b/src/Interpreters/MergeJoin.cpp index 5bd49b3c971..c6df06cfac6 100644 --- a/src/Interpreters/MergeJoin.cpp +++ b/src/Interpreters/MergeJoin.cpp @@ -80,8 +80,8 @@ int nullableCompareAt(const IColumn & left_column, const IColumn & right_column, if constexpr (has_left_nulls && has_right_nulls) { - const auto * left_nullable = checkAndGetColumn(left_column); - const auto * right_nullable = checkAndGetColumn(right_column); + const auto * left_nullable = checkAndGetColumn(&left_column); + const auto * right_nullable = checkAndGetColumn(&right_column); if (left_nullable && right_nullable) { @@ -99,7 +99,7 @@ int nullableCompareAt(const IColumn & left_column, const IColumn & right_column, if constexpr (has_left_nulls) { - if (const auto * left_nullable = checkAndGetColumn(left_column)) + if (const auto * left_nullable = checkAndGetColumn(&left_column)) { if (left_column.isNullAt(lhs_pos)) return null_direction_hint; @@ -109,7 +109,7 @@ int nullableCompareAt(const IColumn & left_column, const IColumn & right_column, if constexpr (has_right_nulls) { - if (const auto * right_nullable = checkAndGetColumn(right_column)) + if (const auto * right_nullable = checkAndGetColumn(&right_column)) { if (right_column.isNullAt(rhs_pos)) return -null_direction_hint; diff --git a/src/Interpreters/NullableUtils.cpp b/src/Interpreters/NullableUtils.cpp index ce681b1d569..fa0ddae8c90 100644 --- a/src/Interpreters/NullableUtils.cpp +++ b/src/Interpreters/NullableUtils.cpp @@ -12,7 +12,7 @@ ColumnPtr extractNestedColumnsAndNullMap(ColumnRawPtrs & key_columns, ConstNullM if (key_columns.size() == 1) { auto & column = key_columns[0]; - if (const auto * column_nullable = checkAndGetColumn(*column)) + if (const auto * column_nullable = checkAndGetColumn(&*column)) { null_map_holder = column_nullable->getNullMapColumnPtr(); null_map = &column_nullable->getNullMapData(); @@ -23,7 +23,7 @@ ColumnPtr extractNestedColumnsAndNullMap(ColumnRawPtrs & key_columns, ConstNullM { for (auto & column : key_columns) { - if (const auto * column_nullable = checkAndGetColumn(*column)) + if (const auto * column_nullable = checkAndGetColumn(&*column)) { column = &column_nullable->getNestedColumn(); diff --git a/src/Interpreters/SetVariants.cpp b/src/Interpreters/SetVariants.cpp index 0fb2e5189d4..64796a013f1 100644 --- a/src/Interpreters/SetVariants.cpp +++ b/src/Interpreters/SetVariants.cpp @@ -74,7 +74,7 @@ typename SetVariantsTemplate::Type SetVariantsTemplate::choose for (const auto & col : key_columns) { - if (const auto * nullable = checkAndGetColumn(*col)) + if (const auto * 
nullable = checkAndGetColumn(&*col)) { nested_key_columns.push_back(&nullable->getNestedColumn()); has_nullable_key = true; diff --git a/src/Interpreters/SetVariants.h b/src/Interpreters/SetVariants.h index ff527102080..f6eac517349 100644 --- a/src/Interpreters/SetVariants.h +++ b/src/Interpreters/SetVariants.h @@ -80,7 +80,7 @@ protected: for (const auto & col : key_columns) { - if (const auto * nullable = checkAndGetColumn(*col)) + if (const auto * nullable = checkAndGetColumn(&*col)) { actual_columns.push_back(&nullable->getNestedColumn()); null_maps.push_back(&nullable->getNullMapColumn()); diff --git a/src/Processors/Transforms/CheckConstraintsTransform.cpp b/src/Processors/Transforms/CheckConstraintsTransform.cpp index 3a6595ea4fb..e43aa6028da 100644 --- a/src/Processors/Transforms/CheckConstraintsTransform.cpp +++ b/src/Processors/Transforms/CheckConstraintsTransform.cpp @@ -57,7 +57,7 @@ void CheckConstraintsTransform::onConsume(Chunk chunk) auto result_column = res_column.column->convertToFullColumnIfConst()->convertToFullColumnIfLowCardinality(); - if (const auto * column_nullable = checkAndGetColumn(*result_column)) + if (const auto * column_nullable = checkAndGetColumn(&*result_column)) { const auto & nested_column = column_nullable->getNestedColumnPtr(); diff --git a/src/Processors/Transforms/MergeJoinTransform.cpp b/src/Processors/Transforms/MergeJoinTransform.cpp index 584125b046f..92f4110e9ed 100644 --- a/src/Processors/Transforms/MergeJoinTransform.cpp +++ b/src/Processors/Transforms/MergeJoinTransform.cpp @@ -48,8 +48,8 @@ int nullableCompareAt(const IColumn & left_column, const IColumn & right_column, { if constexpr (has_left_nulls && has_right_nulls) { - const auto * left_nullable = checkAndGetColumn(left_column); - const auto * right_nullable = checkAndGetColumn(right_column); + const auto * left_nullable = checkAndGetColumn(&left_column); + const auto * right_nullable = checkAndGetColumn(&right_column); if (left_nullable && right_nullable) { @@ -67,7 +67,7 @@ int nullableCompareAt(const IColumn & left_column, const IColumn & right_column, if constexpr (has_left_nulls) { - if (const auto * left_nullable = checkAndGetColumn(left_column)) + if (const auto * left_nullable = checkAndGetColumn(&left_column)) { if (left_nullable->isNullAt(lhs_pos)) return null_direction_hint; @@ -77,7 +77,7 @@ int nullableCompareAt(const IColumn & left_column, const IColumn & right_column, if constexpr (has_right_nulls) { - if (const auto * right_nullable = checkAndGetColumn(right_column)) + if (const auto * right_nullable = checkAndGetColumn(&right_column)) { if (right_nullable->isNullAt(rhs_pos)) return -null_direction_hint; diff --git a/src/Processors/Transforms/WindowTransform.cpp b/src/Processors/Transforms/WindowTransform.cpp index f43b9a2e794..cf6a84db9e6 100644 --- a/src/Processors/Transforms/WindowTransform.cpp +++ b/src/Processors/Transforms/WindowTransform.cpp @@ -2516,7 +2516,7 @@ struct WindowFunctionNonNegativeDerivative final : public StatefulWindowFunction if (ts_scale_multiplier) { const auto & column = transform->blockAt(transform->current_row.block).input_columns[workspace.argument_column_indices[ARGUMENT_TIMESTAMP]]; - const auto & curr_timestamp = checkAndGetColumn(column.get())->getInt(transform->current_row.row); + const auto & curr_timestamp = checkAndGetColumn(*column).getInt(transform->current_row.row); Float64 time_elapsed = curr_timestamp - state.previous_timestamp; result = (time_elapsed > 0) ? 
(metric_diff * ts_scale_multiplier / time_elapsed * interval_duration) : 0; diff --git a/src/Storages/MergeTree/MergeTreeIndexSet.cpp b/src/Storages/MergeTree/MergeTreeIndexSet.cpp index dba2bc1e56c..1bd42518fdd 100644 --- a/src/Storages/MergeTree/MergeTreeIndexSet.cpp +++ b/src/Storages/MergeTree/MergeTreeIndexSet.cpp @@ -305,7 +305,7 @@ bool MergeTreeIndexConditionSet::mayBeTrueOnGranule(MergeTreeIndexGranulePtr idx const NullMap * null_map = nullptr; - if (const auto * col_nullable = checkAndGetColumn(*column)) + if (const auto * col_nullable = checkAndGetColumn(&*column)) { col_uint8 = typeid_cast(&col_nullable->getNestedColumn()); null_map = &col_nullable->getNullMapData(); From 694a8ca81992210dabfcf2da32004899263ae284 Mon Sep 17 00:00:00 2001 From: Michael Kolupaev Date: Fri, 29 Mar 2024 23:33:12 +0000 Subject: [PATCH 093/289] Style --- src/Functions/FunctionHelpers.h | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/Functions/FunctionHelpers.h b/src/Functions/FunctionHelpers.h index 89b224e79ef..9eabb9a0370 100644 --- a/src/Functions/FunctionHelpers.h +++ b/src/Functions/FunctionHelpers.h @@ -15,6 +15,11 @@ namespace DB { +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; +} + class IFunction; /// Methods, that helps dispatching over real column types. From 4b9819a8f5d6b5407486a8d25bcf24dfdee8950f Mon Sep 17 00:00:00 2001 From: Michael Kolupaev Date: Mon, 6 May 2024 22:25:32 +0000 Subject: [PATCH 094/289] Update call sites added since last commit --- src/Functions/UTCTimestampTransform.cpp | 12 ++++++------ src/Storages/MergeTree/MergeTreeIndexBloomFilter.cpp | 4 ++-- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/src/Functions/UTCTimestampTransform.cpp b/src/Functions/UTCTimestampTransform.cpp index 0fcba91f49f..6d301270d8e 100644 --- a/src/Functions/UTCTimestampTransform.cpp +++ b/src/Functions/UTCTimestampTransform.cpp @@ -80,14 +80,14 @@ namespace const DateLUTImpl & utc_time_zone = DateLUT::instance("UTC"); if (WhichDataType(arg1.type).isDateTime()) { - const auto * date_time_col = checkAndGetColumn(arg1.column.get()); - size_t col_size = date_time_col->size(); + const auto & date_time_col = checkAndGetColumn(*arg1.column); + size_t col_size = date_time_col.size(); using ColVecTo = DataTypeDateTime::ColumnType; typename ColVecTo::MutablePtr result_column = ColVecTo::create(col_size); typename ColVecTo::Container & result_data = result_column->getData(); for (size_t i = 0; i < col_size; ++i) { - UInt32 date_time_val = date_time_col->getElement(i); + UInt32 date_time_val = date_time_col.getElement(i); LocalDateTime date_time(date_time_val, Name::to ? utc_time_zone : DateLUT::instance(time_zone_val)); time_t time_val = date_time.to_time_t(Name::from ? 
utc_time_zone : DateLUT::instance(time_zone_val)); result_data[i] = static_cast(time_val); @@ -96,8 +96,8 @@ namespace } else if (WhichDataType(arg1.type).isDateTime64()) { - const auto * date_time_col = checkAndGetColumn(arg1.column.get()); - size_t col_size = date_time_col->size(); + const auto & date_time_col = checkAndGetColumn(*arg1.column); + size_t col_size = date_time_col.size(); const DataTypeDateTime64 * date_time_type = static_cast(arg1.type.get()); UInt32 col_scale = date_time_type->getScale(); Int64 scale_multiplier = DecimalUtils::scaleMultiplier(col_scale); @@ -106,7 +106,7 @@ namespace typename ColDecimalTo::Container & result_data = result_column->getData(); for (size_t i = 0; i < col_size; ++i) { - DateTime64 date_time_val = date_time_col->getElement(i); + DateTime64 date_time_val = date_time_col.getElement(i); Int64 seconds = date_time_val.value / scale_multiplier; Int64 micros = date_time_val.value % scale_multiplier; LocalDateTime date_time(seconds, Name::to ? utc_time_zone : DateLUT::instance(time_zone_val)); diff --git a/src/Storages/MergeTree/MergeTreeIndexBloomFilter.cpp b/src/Storages/MergeTree/MergeTreeIndexBloomFilter.cpp index 4f25a014382..4b164f5ac42 100644 --- a/src/Storages/MergeTree/MergeTreeIndexBloomFilter.cpp +++ b/src/Storages/MergeTree/MergeTreeIndexBloomFilter.cpp @@ -865,8 +865,8 @@ void MergeTreeIndexAggregatorBloomFilter::update(const Block & block, size_t * p const auto & column_and_type = block.getByName(index_columns_name[column]); auto index_column = BloomFilterHash::hashWithColumn(column_and_type.type, column_and_type.column, *pos, max_read_rows); - const auto & index_col = checkAndGetColumn(index_column.get()); - const auto & index_data = index_col->getData(); + const auto & index_col = checkAndGetColumn(*index_column); + const auto & index_data = index_col.getData(); for (const auto & hash: index_data) column_hashes[column].insert(hash); } From a20ef2a3d07343ff914f01db39b8dbb7e02d7584 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=D0=9A=D0=B8=D1=80=D0=B8=D0=BB=D0=BB=20=D0=93=D0=B0=D1=80?= =?UTF-8?q?=D0=B1=D0=B0=D1=80?= Date: Tue, 7 May 2024 02:06:13 +0300 Subject: [PATCH 095/289] Add allow without connection setting to MaterializedMySQLSettings --- .../database-engines/materialized-mysql.md | 3 +++ src/Databases/MySQL/DatabaseMaterializedMySQL.cpp | 6 +++++- src/Databases/MySQL/MaterializedMySQLSettings.h | 1 + .../materialized_with_ddl.py | 15 ++++++++++++++- 4 files changed, 23 insertions(+), 2 deletions(-) diff --git a/docs/en/engines/database-engines/materialized-mysql.md b/docs/en/engines/database-engines/materialized-mysql.md index f32698f84f6..2b4d5fe04aa 100644 --- a/docs/en/engines/database-engines/materialized-mysql.md +++ b/docs/en/engines/database-engines/materialized-mysql.md @@ -51,6 +51,9 @@ ENGINE = MaterializedMySQL('host:port', ['database' | database], 'user', 'passwo ### allows_query_when_mysql_lost `allows_query_when_mysql_lost` — Allows to query a materialized table when MySQL is lost. Default: `0` (`false`). +### allow_startup_database_without_connection_to_mysql +`allow_startup_database_without_connection_to_mysql` — Allow to create and attach database without available connection to MySQL. Default: `0` (`false`). + ### materialized_mysql_tables_list `materialized_mysql_tables_list` — a comma-separated list of mysql database tables, which will be replicated by MaterializedMySQL database engine. Default value: empty list — means whole tables will be replicated. 
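The guard added below in DatabaseMaterializedMySQL::startupDatabaseAsync ties the new setting to the loading mode: MySQL availability is asserted only for a fresh CREATE or ATTACH, never for a forced attach on server restart, and never once the setting opts out. The following is a minimal sketch of that decision logic; the startupCheck helper and both types are hypothetical stand-ins (the real LoadingStrictnessLevel enum has more members), not the actual ClickHouse declarations.

#include <stdexcept>

// Hypothetical stand-ins for the real ClickHouse types, ordered so that a
// comparison against FORCE_ATTACH distinguishes fresh creation from restart.
enum class LoadingStrictnessLevel { CREATE, ATTACH, FORCE_RESTORE, FORCE_ATTACH };

struct Settings { bool allow_startup_database_without_connection_to_mysql = false; };

// Mirrors the guard in startupDatabaseAsync: fail fast on an unreachable MySQL
// only when the setting is off and the database is not force-attached.
void startupCheck(const Settings & settings, LoadingStrictnessLevel mode, bool mysql_reachable)
{
    if (!settings.allow_startup_database_without_connection_to_mysql
        && mode < LoadingStrictnessLevel::FORCE_ATTACH
        && !mysql_reachable)
        throw std::runtime_error("ConnectionFailed: MySQL is unavailable");
    // Otherwise synchronization starts and keeps retrying in the background.
}

In the real hunk the equivalent branch calls materialize_thread.assertMySQLAvailable(), which is what raises the ConnectionFailed error the updated integration test asserts on before retrying the CREATE with the setting enabled.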
diff --git a/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp b/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp index 6d89cc23590..c81fe1b2b26 100644 --- a/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp +++ b/src/Databases/MySQL/DatabaseMaterializedMySQL.cpp @@ -81,9 +81,13 @@ LoadTaskPtr DatabaseMaterializedMySQL::startupDatabaseAsync(AsyncLoader & async_ base->goals(), TablesLoaderBackgroundStartupPoolId, fmt::format("startup MaterializedMySQL database {}", getDatabaseName()), - [this] (AsyncLoader &, const LoadJobPtr &) + [this, mode] (AsyncLoader &, const LoadJobPtr &) { LOG_TRACE(log, "Starting MaterializeMySQL database"); + if (!settings->allow_startup_database_without_connection_to_mysql + && mode < LoadingStrictnessLevel::FORCE_ATTACH) + materialize_thread.assertMySQLAvailable(); + materialize_thread.startSynchronization(); started_up = true; }); diff --git a/src/Databases/MySQL/MaterializedMySQLSettings.h b/src/Databases/MySQL/MaterializedMySQLSettings.h index 557d48be85b..b481846afc1 100644 --- a/src/Databases/MySQL/MaterializedMySQLSettings.h +++ b/src/Databases/MySQL/MaterializedMySQLSettings.h @@ -22,6 +22,7 @@ class ASTStorage; M(UInt64, max_milliseconds_to_wait_in_binlog_queue, 10000, "Max milliseconds to wait when max bytes exceeded in a binlog queue.", 0) \ M(UInt64, max_bytes_in_binlog_dispatcher_buffer, DBMS_DEFAULT_BUFFER_SIZE, "Max bytes in the binlog dispatcher's buffer before it is flushed to attached binlogs.", 0) \ M(UInt64, max_flush_milliseconds_in_binlog_dispatcher, 1000, "Max milliseconds in the binlog dispatcher's buffer to wait before it is flushed to attached binlogs.", 0) \ + M(Bool, allow_startup_database_without_connection_to_mysql, false, "Allow to create and attach database without available connection to MySQL.", 0) \ DECLARE_SETTINGS_TRAITS(MaterializedMySQLSettingsTraits, LIST_OF_MATERIALIZE_MODE_SETTINGS) diff --git a/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py b/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py index dcb2546bad3..86000799ae4 100644 --- a/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py +++ b/tests/integration/test_materialized_mysql_database/materialized_with_ddl.py @@ -3425,8 +3425,21 @@ def mysql_create_database_without_connection(clickhouse_node, mysql_node, servic clickhouse_node.cluster.pause_container(service_name) + assert "ConnectionFailed:" in clickhouse_node.query_and_get_error( + """ + CREATE DATABASE create_without_connection + ENGINE = MaterializedMySQL('{}:3306', 'create_without_connection', 'root', 'clickhouse') + """.format( + service_name + ) + ) + clickhouse_node.query( - "CREATE DATABASE create_without_connection ENGINE = MaterializedMySQL('{}:3306', 'create_without_connection', 'root', 'clickhouse') SETTINGS max_wait_time_when_mysql_unavailable=-1".format( + """ + CREATE DATABASE create_without_connection + ENGINE = MaterializedMySQL('{}:3306', 'create_without_connection', 'root', 'clickhouse') + SETTINGS allow_startup_database_without_connection_to_mysql=1 + """.format( service_name ) ) From d37590aed68e12c5fd7664b1a21138dd428d1482 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 7 May 2024 10:36:44 +0800 Subject: [PATCH 096/289] [update] add test for RawWithNames, RawWithNamesAndTypes and *WithNames, *WithNamesAndTypes; add changelog --- CHANGELOG.md | 1 + .../00397_tsv_format_synonym.reference | 27 +++++++++++++++++++ .../0_stateless/00397_tsv_format_synonym.sql | 8 ++++++ 3 files changed, 36 insertions(+) diff --git 
a/CHANGELOG.md b/CHANGELOG.md index f40c42c4462..955e2f5b72f 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -33,6 +33,7 @@ * A mode for `topK`/`topkWeighed` support mode, which return count of values and its error. [#54508](https://github.com/ClickHouse/ClickHouse/pull/54508) ([UnamedRus](https://github.com/UnamedRus)). * Added function `toMillisecond` which returns the millisecond component for values of type`DateTime` or `DateTime64`. [#60281](https://github.com/ClickHouse/ClickHouse/pull/60281) ([Shaun Struwig](https://github.com/Blargian)). * Allow configuring HTTP redirect handlers for clickhouse-server. For example, you can make `/` redirect to the Play UI. [#60390](https://github.com/ClickHouse/ClickHouse/pull/60390) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Allow Raw as a synonym for TSVRaw. [#63394](https://github.com/ClickHouse/ClickHouse/pull/63394) ([Unalian](https://github.com/Unalian)) #### Performance Improvement * Optimized function `dotProduct` to omit unnecessary and expensive memory copies. [#60928](https://github.com/ClickHouse/ClickHouse/pull/60928) ([Robert Schulze](https://github.com/rschu1ze)). diff --git a/tests/queries/0_stateless/00397_tsv_format_synonym.reference b/tests/queries/0_stateless/00397_tsv_format_synonym.reference index c91169a06fa..3326b039b8d 100644 --- a/tests/queries/0_stateless/00397_tsv_format_synonym.reference +++ b/tests/queries/0_stateless/00397_tsv_format_synonym.reference @@ -31,3 +31,30 @@ UInt8 String String 1 hello world 2 hello world 3 hello world +arr s1 s2 +1 hello world +2 hello world +3 hello world +arr s1 s2 +1 hello world +2 hello world +3 hello world +arr s1 s2 +1 hello world +2 hello world +3 hello world +arr s1 s2 +UInt8 String String +1 hello world +2 hello world +3 hello world +arr s1 s2 +UInt8 String String +1 hello world +2 hello world +3 hello world +arr s1 s2 +UInt8 String String +1 hello world +2 hello world +3 hello world diff --git a/tests/queries/0_stateless/00397_tsv_format_synonym.sql b/tests/queries/0_stateless/00397_tsv_format_synonym.sql index 51283c6ced9..b3b231fbf3f 100644 --- a/tests/queries/0_stateless/00397_tsv_format_synonym.sql +++ b/tests/queries/0_stateless/00397_tsv_format_synonym.sql @@ -10,3 +10,11 @@ SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TSVWithN SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TabSeparatedRaw; SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TSVRaw; SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT Raw; + +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TabSeparatedRawWithNames; +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TSVRawWithNames; +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT RawWithNames; + +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TabSeparatedRawWithNamesAndTypes; +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT TSVRawWithNamesAndTypes; +SELECT arrayJoin([1, 2, 3]) AS arr, 'hello' AS s1, 'world' AS s2 FORMAT RawWithNamesAndTypes; From a8ae0074aa5563b8e65ae110fa5dc71313a81a77 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 7 May 2024 10:40:46 +0800 Subject: [PATCH 097/289] [fix] name->names --- docs/en/interfaces/formats.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index 937dfb52609..0b108edc17f 100644 --- 
a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -206,7 +206,7 @@ SELECT * FROM nestedt FORMAT TSV
 
 Differs from `TabSeparated` format in that the rows are written without escaping.
 When parsing with this format, tabs or linefeeds are not allowed in each field.
 
-This format is also available under the name `TSVRaw`, `Raw`.
+This format is also available under the names `TSVRaw`, `Raw`.
 
 ## TabSeparatedWithNames {#tabseparatedwithnames}
 
@@ -241,14 +241,14 @@ This format is also available under the name `TSVWithNamesAndTypes`.
 
 Differs from `TabSeparatedWithNames` format in that the rows are written without escaping.
 When parsing with this format, tabs or linefeeds are not allowed in each field.
 
-This format is also available under the name `TSVRawWithNames`, `RawWithNames`.
+This format is also available under the names `TSVRawWithNames`, `RawWithNames`.
 
 ## TabSeparatedRawWithNamesAndTypes {#tabseparatedrawwithnamesandtypes}
 
 Differs from `TabSeparatedWithNamesAndTypes` format in that the rows are written without escaping.
 When parsing with this format, tabs or linefeeds are not allowed in each field.
 
-This format is also available under the name `TSVRawWithNamesAndNames`, `RawWithNamesAndNames`.
+This format is also available under the names `TSVRawWithNamesAndTypes`, `RawWithNamesAndTypes`.
 
 ## Template {#format-template}

From 0a1d852dfd52cc88502a7699d249328edb041976 Mon Sep 17 00:00:00 2001
From: Julia Kartseva
Date: Thu, 2 May 2024 21:35:32 +0000
Subject: [PATCH 098/289] Enable plain_rewritable metadata for local and azure

Enable plain_rewritable support for local and azure (azure_blob_storage)
metadata type.

- HDFS object storage currently does not support iteration and does not
  implement listObjects method. It's a blocker for enabling
  plain_rewritable metadata type with HDFS.
- StaticWeb object storage is read-only and works with its dedicated
  metadata type.
---
 .../ObjectStorages/ObjectStorageFactory.cpp   | 14 +++++--
 .../PlainRewritableObjectStorage.h            | 39 ++++++++++++++++++-
 .../ObjectStorages/S3/S3ObjectStorage.cpp     |  7 ----
 src/Disks/ObjectStorages/S3/S3ObjectStorage.h |  3 --
 .../03008_local_plain_rewritable.reference    | 22 +++++++++++
 .../03008_local_plain_rewritable.sh           | 35 +++++++++++++++++
 6 files changed, 106 insertions(+), 14 deletions(-)
 create mode 100644 tests/queries/0_stateless/03008_local_plain_rewritable.reference
 create mode 100755 tests/queries/0_stateless/03008_local_plain_rewritable.sh

diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp
index 7b949db268b..264ec2b258e 100644
--- a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp
+++ b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp
@@ -73,9 +73,17 @@ ObjectStoragePtr createObjectStorage(
         return std::make_shared<PlainObjectStorage<BaseObjectStorage>>(std::forward<Args>(args)...);
     else if (isPlainRewritableStorage(type, config, config_prefix))
     {
-        /// TODO(jkartseva@): Test support for generic disk type
-        if (type != ObjectStorageType::S3)
-            throw Exception(ErrorCodes::NOT_IMPLEMENTED, "plain_rewritable metadata storage support is implemented only for S3");
+        /// HDFS object storage currently does not support iteration and does not implement listObjects method.
+        /// StaticWeb object storage is read-only and works with its dedicated metadata type.
+        constexpr auto supported_object_storage_types
+            = std::array{ObjectStorageType::S3, ObjectStorageType::Local, ObjectStorageType::Azure};
+        if (std::find(supported_object_storage_types.begin(), supported_object_storage_types.end(), type)
+            == supported_object_storage_types.end())
+            throw Exception(
+                ErrorCodes::NOT_IMPLEMENTED,
+                "plain_rewritable metadata storage support is not implemented for '{}' object storage",
+                DataSourceDescription{DataSourceType::ObjectStorage, type, MetadataStorageType::PlainRewritable, /*description*/ ""}
+                    .toString());
+
         return std::make_shared<PlainRewritableObjectStorage<BaseObjectStorage>>(std::forward<Args>(args)...);
     }

diff --git a/src/Disks/ObjectStorages/PlainRewritableObjectStorage.h b/src/Disks/ObjectStorages/PlainRewritableObjectStorage.h
index d71e995b490..2b116cff443 100644
--- a/src/Disks/ObjectStorages/PlainRewritableObjectStorage.h
+++ b/src/Disks/ObjectStorages/PlainRewritableObjectStorage.h
@@ -1,16 +1,26 @@
 #pragma once
 
 #include <Disks/ObjectStorages/IObjectStorage.h>
+#include <Common/ObjectStorageKeyGenerator.h>
+#include "CommonPathPrefixKeyGenerator.h"
 
 namespace DB
 {
 
+namespace ErrorCodes
+{
+extern const int LOGICAL_ERROR;
+}
+
 template <typename BaseObjectStorage>
 class PlainRewritableObjectStorage : public BaseObjectStorage
 {
 public:
     template <class... Args>
-    explicit PlainRewritableObjectStorage(Args &&... args) : BaseObjectStorage(std::forward<Args>(args)...)
+    explicit PlainRewritableObjectStorage(Args &&... args)
+        : BaseObjectStorage(std::forward<Args>(args)...)
+        /// A basic key generator is required for checking S3 capabilities,
+        /// it will be reset later by metadata storage.
+        , key_generator(createObjectStorageKeysGeneratorAsIsWithPrefix(BaseObjectStorage::getCommonKeyPrefix()))
     {
     }
 
@@ -19,6 +29,33 @@ public:
     bool isWriteOnce() const override { return false; }
 
     bool isPlain() const override { return true; }
+
+    ObjectStorageKey generateObjectKeyForPath(const std::string & path) const override;
+
+    ObjectStorageKey generateObjectKeyPrefixForDirectoryPath(const std::string & path) const override;
+
+    void setKeysGenerator(ObjectStorageKeysGeneratorPtr gen) override { key_generator = gen; }
+
+private:
+    ObjectStorageKeysGeneratorPtr key_generator;
 };
+
+template <typename BaseObjectStorage>
+ObjectStorageKey PlainRewritableObjectStorage<BaseObjectStorage>::generateObjectKeyForPath(const std::string & path) const
+{
+    if (!key_generator)
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Key generator is not set");
+
+    return key_generator->generate(path, /* is_directory */ false);
+}
+
+template <typename BaseObjectStorage>
+ObjectStorageKey PlainRewritableObjectStorage<BaseObjectStorage>::generateObjectKeyPrefixForDirectoryPath(const std::string & path) const
+{
+    if (!key_generator)
+        throw Exception(ErrorCodes::LOGICAL_ERROR, "Key generator is not set");
+
+    return key_generator->generate(path, /* is_directory */ true);
+}
 }

diff --git a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp
index 2eae8877f87..a58b37f1df9 100644
--- a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp
+++ b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp
@@ -574,13 +574,6 @@ ObjectStorageKey S3ObjectStorage::generateObjectKeyForPath(const std::string & p
     return key_generator->generate(path, /* is_directory */ false);
 }
 
-ObjectStorageKey S3ObjectStorage::generateObjectKeyPrefixForDirectoryPath(const std::string & path) const
-{
-    if (!key_generator)
-        throw Exception(ErrorCodes::LOGICAL_ERROR, "Key generator is not set");
-
-    return key_generator->generate(path, /* is_directory */ true);
-}
 }
 
 #endif

diff --git a/src/Disks/ObjectStorages/S3/S3ObjectStorage.h b/src/Disks/ObjectStorages/S3/S3ObjectStorage.h
index ff66b00e47c..5eaab4b585c 100644
--- a/src/Disks/ObjectStorages/S3/S3ObjectStorage.h
+++ b/src/Disks/ObjectStorages/S3/S3ObjectStorage.h
@@ -159,12 +159,9 @@ public:
 
     bool supportParallelWrite() const override { return true; }
 
     ObjectStorageKey generateObjectKeyForPath(const std::string & path) const override;
-    ObjectStorageKey generateObjectKeyPrefixForDirectoryPath(const std::string & path) const override;
 
     bool isReadOnly() const override { return s3_settings.get()->read_only; }
 
-    void setKeysGenerator(ObjectStorageKeysGeneratorPtr gen) override { key_generator = gen; }
-
 private:
     void setNewSettings(std::unique_ptr<S3ObjectStorageSettings> && s3_settings_);

diff --git a/tests/queries/0_stateless/03008_local_plain_rewritable.reference b/tests/queries/0_stateless/03008_local_plain_rewritable.reference
new file mode 100644
index 00000000000..10fc932ca4d
--- /dev/null
+++ b/tests/queries/0_stateless/03008_local_plain_rewritable.reference
@@ -0,0 +1,22 @@
+10006
+0 0 0
+1 1 1
+1 2 0
+2 2 2
+2 2 2
+3 1 9
+3 3 3
+4 4 4
+4 7 7
+5 5 5
+10006
+0 0 0
+1 1 1
+1 2 0
+2 2 2
+2 2 2
+3 1 9
+3 3 3
+4 4 4
+4 7 7
+5 5 5

diff --git a/tests/queries/0_stateless/03008_local_plain_rewritable.sh b/tests/queries/0_stateless/03008_local_plain_rewritable.sh
new file mode 100755
index 00000000000..07fd013c911
--- /dev/null
+++ b/tests/queries/0_stateless/03008_local_plain_rewritable.sh
@@ -0,0 +1,35 @@
+#!/usr/bin/env bash
+# Tags: no-random-settings, no-replicated-database, no-shared-merge-tree
+# Tag no-random-settings: enable after root causing flakiness
+
+CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
+# shellcheck source=../shell_config.sh
+. "$CUR_DIR"/../shell_config.sh
+
+${CLICKHOUSE_CLIENT} --query "drop table if exists test_mt sync"
+
+${CLICKHOUSE_CLIENT} -nm --query "
+create table test_mt (a Int32, b Int64, c Int64) engine = MergeTree() partition by intDiv(a, 1000) order by tuple(a, b)
+settings disk = disk(
+    type = object_storage,
+    object_storage_type = local,
+    metadata_type = plain_rewritable,
+    path = '/var/lib/clickhouse/disks/local_plain_rewritable/')
+"
+
+${CLICKHOUSE_CLIENT} -nm --query "
+insert into test_mt (*) values (1, 2, 0), (2, 2, 2), (3, 1, 9), (4, 7, 7), (5, 10, 2), (6, 12, 5);
+insert into test_mt (*) select number, number, number from numbers_mt(10000);
+"
+
+${CLICKHOUSE_CLIENT} -nm --query "
+select count(*) from test_mt;
+select (*) from test_mt order by tuple(a, b) limit 10;
+"
+
+${CLICKHOUSE_CLIENT} --query "optimize table test_mt final"
+
+${CLICKHOUSE_CLIENT} -nm --query "
+select count(*) from test_mt;
+select (*) from test_mt order by tuple(a, b) limit 10;
+"

From c6f17b25e47ffcf96ff49f869f5ecd6b67b910b8 Mon Sep 17 00:00:00 2001
From: Julia Kartseva
Date: Fri, 3 May 2024 03:59:50 +0000
Subject: [PATCH 099/289] plain_rewritable: add integration test for Azure

---
 .../__init__.py                               |   0
 .../test.py                                   | 153 ++++++++++++++++++
 2 files changed, 153 insertions(+)
 create mode 100644 tests/integration/test_azure_blob_storage_plain_rewritable/__init__.py
 create mode 100644 tests/integration/test_azure_blob_storage_plain_rewritable/test.py

diff --git a/tests/integration/test_azure_blob_storage_plain_rewritable/__init__.py b/tests/integration/test_azure_blob_storage_plain_rewritable/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/tests/integration/test_azure_blob_storage_plain_rewritable/test.py b/tests/integration/test_azure_blob_storage_plain_rewritable/test.py
new file mode 100644
index 00000000000..96d116ec6a2
--- /dev/null
+++ b/tests/integration/test_azure_blob_storage_plain_rewritable/test.py
@@ -0,0 +1,153 @@
+import logging
+import os
+import random
+import string
+
+import pytest
+
+from helpers.cluster import ClickHouseCluster
+from azure.storage.blob import BlobServiceClient
+from test_storage_azure_blob_storage.test import azure_query
+
+NODE_NAME = "node"
+
+
+def generate_cluster_def(port):
+    path = os.path.join(
+        os.path.dirname(os.path.realpath(__file__)),
+        "./_gen/disk_storage_conf.xml",
+    )
+    os.makedirs(os.path.dirname(path), exist_ok=True)
+    with open(path, "w") as f:
+        f.write(
+            f"""
+<clickhouse>
+    <storage_configuration>
+        <disks>
+            <blob_storage_disk>
+                <type>object_storage</type>
+                <object_storage_type>azure_blob_storage</object_storage_type>
+                <metadata_type>plain_rewritable</metadata_type>
+                <storage_account_url>http://azurite1:{port}/devstoreaccount1</storage_account_url>
+                <container_name>cont</container_name>
+                <skip_access_check>true</skip_access_check>
+                <account_name>devstoreaccount1</account_name>
+                <account_key>Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==</account_key>
+                <max_single_part_upload_size>100000</max_single_part_upload_size>
+                <min_upload_part_size>100000</min_upload_part_size>
+                <max_single_download_retries>10</max_single_download_retries>
+                <max_single_read_retries>10</max_single_read_retries>
+            </blob_storage_disk>
+        </disks>
+        <policies>
+            <blob_storage_policy>
+                <volumes>
+                    <main>
+                        <disk>blob_storage_disk</disk>
+                    </main>
+                </volumes>
+            </blob_storage_policy>
+        </policies>
+    </storage_configuration>
+</clickhouse>
+""" + ) + return path + + +insert_values = [ + "(0,'data'),(1,'data')", + ",".join( + f"({i},'{''.join(random.choices(string.ascii_lowercase, k=5))}')" + for i in range(10) + ), +] + + +@pytest.fixture(scope="module") +def cluster(): + try: + cluster = ClickHouseCluster(__file__) + port = cluster.azurite_port + path = generate_cluster_def(port) + cluster.add_instance( + NODE_NAME, + main_configs=[ + path, + ], + with_azurite=True, + stay_alive=True, + ) + logging.info("Starting cluster...") + cluster.start() + logging.info("Cluster started") + + yield cluster + finally: + cluster.shutdown() + + +def test_insert_select(cluster): + node = cluster.instances[NODE_NAME] + + for index, value in enumerate(insert_values): + azure_query( + node, + """ + CREATE TABLE test_{} ( + id Int64, + data String + ) ENGINE=MergeTree() + ORDER BY id + SETTINGS storage_policy='blob_storage_policy' + """.format( + index + ), + ) + + azure_query(node, "INSERT INTO test_{} VALUES {}".format(index, value)) + assert ( + azure_query( + node, "SELECT * FROM test_{} ORDER BY id FORMAT Values".format(index) + ) + == value + ) + + +def test_restart_server(cluster): + node = cluster.instances[NODE_NAME] + + for index, value in enumerate(insert_values): + assert ( + azure_query( + node, "SELECT * FROM test_{} ORDER BY id FORMAT Values".format(index) + ) + == value + ) + node.restart_clickhouse() + + for index, value in enumerate(insert_values): + assert ( + azure_query( + node, "SELECT * FROM test_{} ORDER BY id FORMAT Values".format(index) + ) + == value + ) + + +def test_drop_table(cluster): + node = cluster.instances[NODE_NAME] + + for index, value in enumerate(insert_values): + node.query("DROP TABLE IF EXISTS test_{} SYNC".format(index)) + + port = cluster.env_variables["AZURITE_PORT"] + connection_string = ( + f"DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;" + f"AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;" + f"BlobEndpoint=http://127.0.0.1:{port}/devstoreaccount1;" + ) + blob_service_client = BlobServiceClient.from_connection_string(connection_string) + containers = blob_service_client.list_containers() + for container in containers: + container_client = blob_service_client.get_container_client(container) + assert len(list(container_client.list_blobs())) == 0 From fcad15ffc2b7c5d4d1c9e9ce201ba9eb86d4a3d4 Mon Sep 17 00:00:00 2001 From: Julia Kartseva Date: Sat, 4 May 2024 04:26:48 +0000 Subject: [PATCH 100/289] plain_rewritable: update docs --- docs/en/operations/storing-data.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 389c917d427..7005783dd60 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -371,6 +371,8 @@ is equal to ``` +Starting from `24.5` it is possible configure any object storage disk (`s3`, `azure`, `local`) using `plain_rewritable` metadata type. + ### Using Azure Blob Storage {#azure-blob-storage} `MergeTree` family table engines can store data to [Azure Blob Storage](https://azure.microsoft.com/en-us/services/storage/blobs/) using a disk with type `azure_blob_storage`. 
From 5e5477302a71e8959feb8daab1b9459e16b2e168 Mon Sep 17 00:00:00 2001 From: Antonio Andelic Date: Tue, 7 May 2024 09:31:39 +0200 Subject: [PATCH 101/289] Update src/Storages/MergeTree/MergeTreeReadPoolBase.cpp Co-authored-by: Alexander Tokmakov --- src/Storages/MergeTree/MergeTreeReadPoolBase.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp b/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp index c759a12e151..36673238f3b 100644 --- a/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp +++ b/src/Storages/MergeTree/MergeTreeReadPoolBase.cpp @@ -130,7 +130,7 @@ MergeTreeReadTaskPtr MergeTreeReadPoolBase::createTask( parent_part_name, {MergeTreeDataPartState::PreActive, MergeTreeDataPartState::Active, MergeTreeDataPartState::Outdated}); if (!parent_part) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Did not find parent part {} for potentially broken projection part {}", + throw Exception(ErrorCodes::LOGICAL_ERROR, "Did not find parent part {} for projection part {}", parent_part_name, data_part->getDataPartStorage().getFullPath()); return parent_part_name; From da4f6f7b6ce4d7c46f3bd1955352656fd2826f19 Mon Sep 17 00:00:00 2001 From: Maksim Kita Date: Tue, 30 Apr 2024 16:35:57 +0300 Subject: [PATCH 102/289] Added recursive CTE documentation --- .../sql-reference/statements/select/with.md | 235 +++++++++++++++++- 1 file changed, 229 insertions(+), 6 deletions(-) diff --git a/docs/en/sql-reference/statements/select/with.md b/docs/en/sql-reference/statements/select/with.md index a59ef463419..84d3c02eca1 100644 --- a/docs/en/sql-reference/statements/select/with.md +++ b/docs/en/sql-reference/statements/select/with.md @@ -5,21 +5,21 @@ sidebar_label: WITH # WITH Clause -ClickHouse supports Common Table Expressions ([CTE](https://en.wikipedia.org/wiki/Hierarchical_and_recursive_queries_in_SQL)) and substitutes the code defined in the `WITH` clause in all places of use for the rest of `SELECT` query. Named subqueries can be included to the current and child query context in places where table objects are allowed. Recursion is prevented by hiding the current level CTEs from the WITH expression. +ClickHouse supports Common Table Expressions ([CTE](https://en.wikipedia.org/wiki/Hierarchical_and_recursive_queries_in_SQL)) and substitutes the code defined in the `WITH` clause in all places of use for the rest of `SELECT` query. Named subqueries can be included to the current and child query context in places where table objects are allowed. Recursion is prevented by hiding the current level CTEs from the WITH expression. Please note that CTEs do not guarantee the same results in all places they are called because the query will be re-executed for each use case. An example of such behavior is below ``` sql -with cte_numbers as +with cte_numbers as ( - select - num - from generateRandom('num UInt64', NULL) + select + num + from generateRandom('num UInt64', NULL) limit 1000000 ) select - count() + count() from cte_numbers where num in (select num from cte_numbers) ``` @@ -87,3 +87,226 @@ LIMIT 10; WITH test1 AS (SELECT i + 1, j + 1 FROM test1) SELECT * FROM test1; ``` + +# Recursive Queries + +The optional RECURSIVE modifier allows for a WITH query to refer to its own output. 
Example:
+
+**Example:** Sum integers from 1 throught 100
+
+```sql
+WITH RECURSIVE test_table AS (
+    SELECT 1 AS number
+UNION ALL
+    SELECT number + 1 FROM test_table WHERE number < 100
+)
+SELECT sum(number) FROM test_table;
+```
+
+``` text
+┌─sum(number)─┐
+│        5050 │
+└─────────────┘
+```
+
+The general form of a recursive `WITH` query is always a non-recursive term, then `UNION ALL`, then a recursive term, where only the recursive term can contain a reference to the query's own output. A recursive CTE query is executed as follows:
+
+1. Evaluate the non-recursive term. Place the result of the non-recursive term query in a temporary working table.
+2. As long as the working table is not empty, repeat these steps:
+    1. Evaluate the recursive term, substituting the current contents of the working table for the recursive self-reference. Place the result of the recursive term query in a temporary intermediate table.
+    2. Replace the contents of the working table with the contents of the intermediate table, then empty the intermediate table.
+
+Recursive queries are typically used to work with hierarchical or tree-structured data. For example, we can write a query that performs tree traversal:
+
+**Example:** Tree traversal
+
+First let's create a tree table:
+
+```sql
+DROP TABLE IF EXISTS tree;
+CREATE TABLE tree
+(
+    id UInt64,
+    parent_id Nullable(UInt64),
+    data String
+) ENGINE = MergeTree ORDER BY id;
+
+INSERT INTO tree VALUES (0, NULL, 'ROOT'), (1, 0, 'Child_1'), (2, 0, 'Child_2'), (3, 1, 'Child_1_1');
+```
+
+We can traverse that tree with the following query:
+
+**Example:** Tree traversal
+```sql
+WITH RECURSIVE search_tree AS (
+    SELECT id, parent_id, data
+    FROM tree t
+    WHERE t.id = 0
+UNION ALL
+    SELECT t.id, t.parent_id, t.data
+    FROM tree t, search_tree st
+    WHERE t.parent_id = st.id
+)
+SELECT * FROM search_tree;
+```
+
+```text
+┌─id─┬─parent_id─┬─data──────┐
+│  0 │      ᴺᵁᴸᴸ │ ROOT      │
+│  1 │         0 │ Child_1   │
+│  2 │         0 │ Child_2   │
+│  3 │         1 │ Child_1_1 │
+└────┴───────────┴───────────┘
+```
+
+## Search order
+
+To create a depth-first order, we compute for each result row an array of rows that we have already visited:
+
+**Example:** Tree traversal depth-first order
+```sql
+WITH RECURSIVE search_tree AS (
+    SELECT id, parent_id, data, [t.id] AS path
+    FROM tree t
+    WHERE t.id = 0
+UNION ALL
+    SELECT t.id, t.parent_id, t.data, arrayConcat(path, [t.id])
+    FROM tree t, search_tree st
+    WHERE t.parent_id = st.id
+)
+SELECT * FROM search_tree ORDER BY path;
+```
+
+```text
+┌─id─┬─parent_id─┬─data──────┬─path────┐
+│  0 │      ᴺᵁᴸᴸ │ ROOT      │ [0]     │
+│  1 │         0 │ Child_1   │ [0,1]   │
+│  3 │         1 │ Child_1_1 │ [0,1,3] │
+│  2 │         0 │ Child_2   │ [0,2]   │
+└────┴───────────┴───────────┴─────────┘
+```
+
+To create a breadth-first order, the standard approach is to add a column that tracks the depth of the search:
+
+**Example:** Tree traversal breadth-first order
+```sql
+WITH RECURSIVE search_tree AS (
+    SELECT id, parent_id, data, [t.id] AS path, toUInt64(0) AS depth
+    FROM tree t
+    WHERE t.id = 0
+UNION ALL
+    SELECT t.id, t.parent_id, t.data, arrayConcat(path, [t.id]), depth + 1
+    FROM tree t, search_tree st
+    WHERE t.parent_id = st.id
+)
+SELECT * FROM search_tree ORDER BY depth;
+```
+
+```text
+┌─id─┬─link─┬─data──────┬─path────┬─depth─┐
+│  0 │ ᴺᵁᴸᴸ │ ROOT      │ [0]     │     0 │
+│  1 │    0 │ Child_1   │ [0,1]   │     1 │
+│  2 │    0 │ Child_2   │ [0,2]   │     1 │
+│  3 │    1 │ Child_1_1 │ [0,1,3] │     2 │
+└────┴──────┴───────────┴─────────┴───────┘
+```
+
+## Cycle detection
+
+First let's create a graph table:
+
+```sql
+DROP TABLE IF EXISTS graph;
+CREATE TABLE graph
+(
+    from UInt64,
+    to UInt64,
+    label String
+) ENGINE = MergeTree ORDER BY (from, to);
+
+INSERT INTO graph VALUES (1, 2, '1 -> 2'), (1, 3, '1 -> 3'), (2, 3, '2 -> 3'), (1, 4, '1 -> 4'), (4, 5, '4 -> 5');
+```
+
+We can traverse that graph with the following query:
+
+**Example:** Graph traversal without cycle detection
+```sql
+WITH RECURSIVE search_graph AS (
+    SELECT from, to, label FROM graph g
+    UNION ALL
+    SELECT g.from, g.to, g.label
+    FROM graph g, search_graph sg
+    WHERE g.from = sg.to
+)
+SELECT DISTINCT * FROM search_graph ORDER BY from;
+```
+```text
+┌─from─┬─to─┬─label──┐
+│    1 │  4 │ 1 -> 4 │
+│    1 │  2 │ 1 -> 2 │
+│    1 │  3 │ 1 -> 3 │
+│    2 │  3 │ 2 -> 3 │
+│    4 │  5 │ 4 -> 5 │
+└──────┴────┴────────┘
+```
+
+But if we add a cycle to that graph, the previous query will fail with a `Maximum recursive CTE evaluation depth` error:
+
+```sql
+INSERT INTO graph VALUES (5, 1, '5 -> 1');
+
+WITH RECURSIVE search_graph AS (
+    SELECT from, to, label FROM graph g
+UNION ALL
+    SELECT g.from, g.to, g.label
+    FROM graph g, search_graph sg
+    WHERE g.from = sg.to
+)
+SELECT DISTINCT * FROM search_graph ORDER BY from;
+```
+
+```text
+Code: 306. DB::Exception: Received from localhost:9000. DB::Exception: Maximum recursive CTE evaluation depth (1000) exceeded, during evaluation of search_graph AS (SELECT from, to, label FROM graph AS g UNION ALL SELECT g.from, g.to, g.label FROM graph AS g, search_graph AS sg WHERE g.from = sg.to). Consider raising max_recursive_cte_evaluation_depth setting.: While executing RecursiveCTESource. (TOO_DEEP_RECURSION)
+```
+
+The standard method for handling cycles is to compute an array of the already visited nodes:
+
+**Example:** Graph traversal with cycle detection
+```sql
+WITH RECURSIVE search_graph AS (
+    SELECT from, to, label, false AS is_cycle, [tuple(g.from, g.to)] AS path FROM graph g
+UNION ALL
+    SELECT g.from, g.to, g.label, has(path, tuple(g.from, g.to)), arrayConcat(sg.path, [tuple(g.from, g.to)])
+    FROM graph g, search_graph sg
+    WHERE g.from = sg.to AND NOT is_cycle
+)
+SELECT * FROM search_graph WHERE is_cycle ORDER BY from;
+```
+
+```text
+┌─from─┬─to─┬─label──┬─is_cycle─┬─path──────────────────────┐
+│    1 │  4 │ 1 -> 4 │ true     │ [(1,4),(4,5),(5,1),(1,4)] │
+│    4 │  5 │ 4 -> 5 │ true     │ [(4,5),(5,1),(1,4),(4,5)] │
+│    5 │  1 │ 5 -> 1 │ true     │ [(5,1),(1,4),(4,5),(5,1)] │
+└──────┴────┴────────┴──────────┴───────────────────────────┘
+```
+
+## Infinite queries
+
+It is also possible to use inifinite recursive CTE queries if `LIMIT` is used in outer query:
+
+**Example:** Infinite recursive CTE query
+```sql
+WITH RECURSIVE test_table AS (
+    SELECT 1 AS number
+UNION ALL
+    SELECT number + 1 FROM test_table
+)
+SELECT sum(number) FROM (SELECT number FROM test_table LIMIT 100);
+```
+
+```text
+┌─sum(number)─┐
+│        5050 │
+└─────────────┘
+```

From 0b59c24866a6e61989b907aed0219530d6503b30 Mon Sep 17 00:00:00 2001
From: Maksim Kita
Date: Thu, 2 May 2024 18:50:38 +0300
Subject: [PATCH 103/289] Fixed style check

---
 docs/en/sql-reference/statements/select/with.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/en/sql-reference/statements/select/with.md b/docs/en/sql-reference/statements/select/with.md
index 84d3c02eca1..ffde7a3fe54 100644
--- a/docs/en/sql-reference/statements/select/with.md
+++ b/docs/en/sql-reference/statements/select/with.md
@@ -92,7 +92,7 @@ SELECT * FROM test1;
 
 The optional RECURSIVE modifier allows for a WITH query to refer to its own output. Example:
 
-**Example:** Sum integers from 1 throught 100
+**Example:** Sum integers from 1 through 100
 
 ```sql
 WITH RECURSIVE test_table AS (
     SELECT 1 AS number
 UNION ALL
     SELECT number + 1 FROM test_table WHERE number < 100
 )
@@ -293,7 +293,7 @@ SELECT * FROM search_graph WHERE is_cycle ORDER BY from;
 
 ## Infinite queries
 
-It is also possible to use inifinite recursive CTE queries if `LIMIT` is used in outer query:
+It is also possible to use infinite recursive CTE queries if `LIMIT` is used in the outer query:

From f50f28d413bf0ba8cd40dccdbb631c2283dc32f1 Mon Sep 17 00:00:00 2001
From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com>
Date: Tue, 7 May 2024 12:11:01 +0200
Subject: [PATCH 104/289] Update 03145_non_loaded_projection_backup.sh

---
 .../queries/0_stateless/03145_non_loaded_projection_backup.sh | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh
index 721ed784fc2..36ae9843dc4 100755
--- a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh
+++ b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh
@@ -10,6 +10,7 @@ create table tp_1 (x Int32, y Int32, projection p (select x, y order by x)) engi
 insert into tp_1 select number, number from numbers(3);
 
 set mutations_sync = 2;
+system stop merges;
 
 alter table tp_1 add projection pp (select x, count() group by x);
 insert into tp_1 select number, number from numbers(4);
@@ -46,4 +47,4 @@ check table tp_1 settings check_query_single_value_result = 0;" | grep -o "Found
 $CLICKHOUSE_CLIENT -nm -q "
 set send_logs_level='fatal';
 check table tp_1"
-$CLICKHOUSE_CLIENT -q "drop table tp_1 sync"
+$CLICKHOUSE_CLIENT -q "drop table tp_1"

From 791278ba47676ef497c95a308eaca91698717f91 Mon Sep 17 00:00:00 2001
From: Vitaly Baranov
Date: Mon, 6 May 2024 21:45:22 +0200
Subject: [PATCH 105/289] Add logging after a failure with evaluating Replicated*MergeTree engine arguments.

---
 ...tractZooKeeperPathFromReplicatedTableDef.h |  3 +-
 .../MergeTree/registerStorageMergeTree.cpp    | 60 +++++++++++--------
 2 files changed, 36 insertions(+), 27 deletions(-)

diff --git a/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h b/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h
index 1bd58392201..5ef5e1db62e 100644
--- a/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h
+++ b/src/Storages/MergeTree/extractZooKeeperPathFromReplicatedTableDef.h
@@ -11,8 +11,9 @@ class ASTCreateQuery;
 class Context;
 using ContextPtr = std::shared_ptr<const Context>;
 
-/// Extracts a zookeeper path from a specified CREATE TABLE query. Returns std::nullopt if fails.
+/// Extracts a zookeeper path from a specified CREATE TABLE query.
 /// The function checks the table engine and if it is Replicated*MergeTree then it takes the first argument and expands macros in it.
+/// Returns std::nullopt if the specified CREATE query doesn't describe a Replicated table or its arguments can't be evaluated.
 std::optional<String> extractZooKeeperPathFromReplicatedTableDef(const ASTCreateQuery & create_query, const ContextPtr & context);
 
 }

diff --git a/src/Storages/MergeTree/registerStorageMergeTree.cpp b/src/Storages/MergeTree/registerStorageMergeTree.cpp
index 9b0200d5a1c..4244ccccfe0 100644
--- a/src/Storages/MergeTree/registerStorageMergeTree.cpp
+++ b/src/Storages/MergeTree/registerStorageMergeTree.cpp
@@ -296,9 +296,6 @@ static void extractZooKeeperPathAndReplicaNameFromEngineArgs(
         else
             throw Exception(ErrorCodes::BAD_ARGUMENTS, "Replica name must be a string literal{}", verbose_help_message);
 
-        if (replica_name.empty())
-            throw Exception(ErrorCodes::NO_REPLICA_NAME_GIVEN, "No replica name in config{}", verbose_help_message);
-
         expand_macro(ast_zk_path, ast_replica_name);
     }
     else if (is_extended_storage_def
@@ -332,38 +329,45 @@ static void extractZooKeeperPathAndReplicaNameFromEngineArgs(
         throw Exception(ErrorCodes::BAD_ARGUMENTS, "Expected two string literal arguments: zookeeper_path and replica_name");
 }
 
-/// Extracts a zookeeper path from a specified CREATE TABLE query. Returns std::nullopt if fails.
+/// Extracts a zookeeper path from a specified CREATE TABLE query.
 std::optional<String> extractZooKeeperPathFromReplicatedTableDef(const ASTCreateQuery & query, const ContextPtr & context)
 {
+    if (!query.storage || !query.storage->engine)
+        return {};
+
+    const String & engine_name = query.storage->engine->name;
+    if (!isReplicated(engine_name))
+        return {};
+
+    StorageID table_id{query.getDatabase(), query.getTable(), query.uuid};
+
+    ASTs engine_args;
+    if (query.storage->engine->arguments)
+        engine_args = query.storage->engine->arguments->children;
+    for (auto & engine_arg : engine_args)
+        engine_arg = engine_arg->clone();
+
+    LoadingStrictnessLevel mode = LoadingStrictnessLevel::CREATE;
+    String zookeeper_path;
+    String replica_name;
+    RenamingRestrictions renaming_restrictions;
+
     try
     {
-        if (!query.storage || !query.storage->engine)
-            return {};
-
-        const String & engine_name = query.storage->engine->name;
-        if (!isReplicated(engine_name))
-            return {};
-
-        StorageID table_id{query.getDatabase(), query.getTable(), query.uuid};
-        ASTs engine_args;
-        if (query.storage->engine->arguments)
-            engine_args = query.storage->engine->arguments->children;
-        for (auto & engine_arg : engine_args)
-            engine_arg = engine_arg->clone();
-        LoadingStrictnessLevel mode = LoadingStrictnessLevel::CREATE;
-        String zookeeper_path;
-        String replica_name;
-        RenamingRestrictions renaming_restrictions;
-
         extractZooKeeperPathAndReplicaNameFromEngineArgs(query, table_id, engine_name, engine_args, mode, context, zookeeper_path, replica_name, renaming_restrictions);
-
-        return zookeeper_path;
     }
-    catch (...)
+ catch (Exception & e) { - return {}; + if (e.code() == ErrorCodes::BAD_ARGUMENTS) + { + tryLogCurrentException(__PRETTY_FUNCTION__, "Couldn't evaluate engine arguments"); + return {}; + } + throw; } + + return zookeeper_path; } static StoragePtr create(const StorageFactory::Arguments & args) @@ -539,6 +543,10 @@ static StoragePtr create(const StorageFactory::Arguments & args) { extractZooKeeperPathAndReplicaNameFromEngineArgs(args.query, args.table_id, args.engine_name, args.engine_args, args.mode, args.getLocalContext(), zookeeper_path, replica_name, renaming_restrictions); + + if (replica_name.empty()) + throw Exception(ErrorCodes::NO_REPLICA_NAME_GIVEN, "No replica name in config{}", verbose_help_message); + arg_cnt = engine_args.size(); /// Update `arg_cnt` here because extractZooKeeperPathAndReplicaNameFromEngineArgs() could add arguments. arg_num = 2; /// zookeeper_path and replica_name together are always two arguments. } From e6926dc65d37658f48540490190398c91ea22273 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 7 May 2024 12:32:34 +0200 Subject: [PATCH 106/289] Update 03145_non_loaded_projection_backup.sh --- tests/queries/0_stateless/03145_non_loaded_projection_backup.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh index 36ae9843dc4..d92b85a984f 100755 --- a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh +++ b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh @@ -10,7 +10,6 @@ create table tp_1 (x Int32, y Int32, projection p (select x, y order by x)) engi insert into tp_1 select number, number from numbers(3); set mutations_sync = 2; -system stop merges; alter table tp_1 add projection pp (select x, count() group by x); insert into tp_1 select number, number from numbers(4); From 0a580e84eaae0dff89ca5fd151b8c98d3b8f9adb Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 7 May 2024 12:41:06 +0200 Subject: [PATCH 107/289] Update 03145_non_loaded_projection_backup.sh --- tests/queries/0_stateless/03145_non_loaded_projection_backup.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh index d92b85a984f..6f0e00ce3fc 100755 --- a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh +++ b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh @@ -7,6 +7,7 @@ CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) $CLICKHOUSE_CLIENT -nm -q " drop table if exists tp_1; create table tp_1 (x Int32, y Int32, projection p (select x, y order by x)) engine = MergeTree order by y partition by intDiv(y, 100); +system stop merges tp_1; insert into tp_1 select number, number from numbers(3); set mutations_sync = 2; From fe18781bed4c26347cd7746dfc3be75745941eab Mon Sep 17 00:00:00 2001 From: skyoct Date: Tue, 7 May 2024 18:41:37 +0800 Subject: [PATCH 108/289] batter --- .../02415_all_new_functions_must_be_documented.reference | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference b/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference index 3ddf165dec0..a152066a460 100644 --- a/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference +++ 
b/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference
@@ -201,6 +201,7 @@ cbrt
 ceil
 char
 cityHash64
+clamp
 coalesce
 concat
 concatAssumeInjective

From 1bae2d9d4ffa6b4757dc2aeccb9eccf89bebc072 Mon Sep 17 00:00:00 2001
From: zvonand
Date: Tue, 7 May 2024 12:57:14 +0200
Subject: [PATCH 109/289] update comment

---
 src/Storages/StorageS3.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp
index 8a4e30fed1d..e65d0cb5be4 100644
--- a/src/Storages/StorageS3.cpp
+++ b/src/Storages/StorageS3.cpp
@@ -489,7 +489,8 @@ size_t StorageS3Source::DisclosedGlobIterator::estimatedKeysCount()
     {
         /// 1000 files were listed, and we cannot make any estimation of _how many more_ there are (because we list bucket lazily);
         /// If there are more objects in the bucket, limiting the number of streams is the last thing we may want to do
-        /// as it would lead to serious (up to <max_threads> times) reading performance degradation.
+        /// as it would lead to serious slow down of the execution, since objects are going
+        /// to be fetched sequentially rather than in-parallel with up to <max_threads> times.
         return std::numeric_limits<size_t>::max();
     }
     else

From 0609054e9849b915847cbd93cb3d76786eebe0cc Mon Sep 17 00:00:00 2001
From: unashi
Date: Tue, 7 May 2024 21:09:33 +0800
Subject: [PATCH 110/289] [update] update a stateless case

---
 .../02187_async_inserts_all_formats.          | 52 +++++++++++++++++++
 .../02187_async_inserts_all_formats.reference |  3 ++
 2 files changed, 55 insertions(+)
 create mode 100644 tests/queries/0_stateless/02187_async_inserts_all_formats.

diff --git a/tests/queries/0_stateless/02187_async_inserts_all_formats. b/tests/queries/0_stateless/02187_async_inserts_all_formats.
new file mode 100644
index 00000000000..f42a6d39d4f
--- /dev/null
+++ b/tests/queries/0_stateless/02187_async_inserts_all_formats.
@@ -0,0 +1,52 @@
+Arrow
+ArrowStream
+Avro
+BSONEachRow
+CSV
+CSVWithNames
+CSVWithNamesAndTypes
+CustomSeparated
+CustomSeparatedWithNames
+CustomSeparatedWithNamesAndTypes
+JSON
+JSONColumns
+JSONColumnsWithMetadata
+JSONCompact
+JSONCompactColumns
+JSONCompactEachRow
+JSONCompactEachRowWithNames
+JSONCompactEachRowWithNamesAndTypes
+JSONCompactStringsEachRow
+JSONCompactStringsEachRowWithNames
+JSONCompactStringsEachRowWithNamesAndTypes
+JSONEachRow
+JSONLines
+JSONObjectEachRow
+JSONStringsEachRow
+MsgPack
+NDJSON
+Native
+ORC
+Parquet
+Raw
+RawWithNames
+RawWithNamesAndTypes
+RowBinary
+RowBinaryWithNames
+RowBinaryWithNamesAndTypes
+TSKV
+TSV
+TSVRaw
+TSVRawWithNames
+TSVRawWithNamesAndTypes
+TSVWithNames
+TSVWithNamesAndTypes
+TabSeparated
+TabSeparatedRaw
+TabSeparatedRawWithNames
+TabSeparatedRawWithNamesAndTypes
+TabSeparatedWithNames
+TabSeparatedWithNamesAndTypes
+Values
+LineAsString
+OK

diff --git a/tests/queries/0_stateless/02187_async_inserts_all_formats.reference b/tests/queries/0_stateless/02187_async_inserts_all_formats.reference
index 2de728b4cb4..f42a6d39d4f 100644
--- a/tests/queries/0_stateless/02187_async_inserts_all_formats.reference
+++ b/tests/queries/0_stateless/02187_async_inserts_all_formats.reference
@@ -28,6 +28,9 @@ NDJSON
 Native
 ORC
 Parquet
+Raw
+RawWithNames
+RawWithNamesAndTypes
 RowBinary
 RowBinaryWithNames
 RowBinaryWithNamesAndTypes

From 85f766f27c0cbd49e267334c3d184627b554e853 Mon Sep 17 00:00:00 2001
From: unashi
Date: Tue, 7 May 2024 21:11:45 +0800
Subject: [PATCH 111/289] [update] update a stateless case

---
 .../02187_async_inserts_all_formats.
| 52 ------------------- 1 file changed, 52 deletions(-) delete mode 100644 tests/queries/0_stateless/02187_async_inserts_all_formats. diff --git a/tests/queries/0_stateless/02187_async_inserts_all_formats. b/tests/queries/0_stateless/02187_async_inserts_all_formats. deleted file mode 100644 index f42a6d39d4f..00000000000 --- a/tests/queries/0_stateless/02187_async_inserts_all_formats. +++ /dev/null @@ -1,52 +0,0 @@ -Arrow -ArrowStream -Avro -BSONEachRow -CSV -CSVWithNames -CSVWithNamesAndTypes -CustomSeparated -CustomSeparatedWithNames -CustomSeparatedWithNamesAndTypes -JSON -JSONColumns -JSONColumnsWithMetadata -JSONCompact -JSONCompactColumns -JSONCompactEachRow -JSONCompactEachRowWithNames -JSONCompactEachRowWithNamesAndTypes -JSONCompactStringsEachRow -JSONCompactStringsEachRowWithNames -JSONCompactStringsEachRowWithNamesAndTypes -JSONEachRow -JSONLines -JSONObjectEachRow -JSONStringsEachRow -MsgPack -NDJSON -Native -ORC -Parquet -Raw -RawWithNames -RawWithNamesAndTypes -RowBinary -RowBinaryWithNames -RowBinaryWithNamesAndTypes -TSKV -TSV -TSVRaw -TSVRawWithNames -TSVRawWithNamesAndTypes -TSVWithNames -TSVWithNamesAndTypes -TabSeparated -TabSeparatedRaw -TabSeparatedRawWithNames -TabSeparatedRawWithNamesAndTypes -TabSeparatedWithNames -TabSeparatedWithNamesAndTypes -Values -LineAsString -OK From 6f2a39b29131578acd10a79486f29f23e323e311 Mon Sep 17 00:00:00 2001 From: alesapin Date: Tue, 7 May 2024 15:32:10 +0200 Subject: [PATCH 112/289] Revert "Do in reverse order" This reverts commit 0b0e97917e3e4ab27a17cbf14d9e73163a20adbe. --- src/Storages/MergeTree/MergeTreeRangeReader.cpp | 15 +++++++-------- 1 file changed, 7 insertions(+), 8 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeRangeReader.cpp b/src/Storages/MergeTree/MergeTreeRangeReader.cpp index 492e4065502..eb757e1d8c7 100644 --- a/src/Storages/MergeTree/MergeTreeRangeReader.cpp +++ b/src/Storages/MergeTree/MergeTreeRangeReader.cpp @@ -1007,10 +1007,6 @@ MergeTreeRangeReader::ReadResult MergeTreeRangeReader::read(size_t max_rows, Mar filterColumns(columns, read_result.final_filter); } - /// If columns not empty, then apply on-fly alter conversions if any required - if (!prewhere_info || prewhere_info->perform_alter_conversions) - merge_tree_reader->performRequiredConversions(columns); - /// If some columns absent in part, then evaluate default values if (should_evaluate_missing_defaults) { @@ -1022,6 +1018,9 @@ MergeTreeRangeReader::ReadResult MergeTreeRangeReader::read(size_t max_rows, Mar merge_tree_reader->evaluateMissingDefaults(additional_columns, columns); } + /// If columns not empty, then apply on-fly alter conversions if any required + if (!prewhere_info || prewhere_info->perform_alter_conversions) + merge_tree_reader->performRequiredConversions(columns); } read_result.columns.reserve(read_result.columns.size() + columns.size()); @@ -1047,14 +1046,14 @@ MergeTreeRangeReader::ReadResult MergeTreeRangeReader::read(size_t max_rows, Mar bool should_evaluate_missing_defaults; merge_tree_reader->fillMissingColumns(columns, should_evaluate_missing_defaults, read_result.num_rows); - /// If result not empty, then apply on-fly alter conversions if any required - if (!prewhere_info || prewhere_info->perform_alter_conversions) - merge_tree_reader->performRequiredConversions(columns); - /// If some columns absent in part, then evaluate default values if (should_evaluate_missing_defaults) merge_tree_reader->evaluateMissingDefaults({}, columns); + /// If result not empty, then apply on-fly alter conversions if any required + 
if (!prewhere_info || prewhere_info->perform_alter_conversions) + merge_tree_reader->performRequiredConversions(columns); + for (size_t i = 0; i < columns.size(); ++i) read_result.columns[i] = std::move(columns[i]); } From 49284724ef4b34bbc5112bfa63a99625e8d35fe7 Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Tue, 7 May 2024 16:10:21 +0200 Subject: [PATCH 113/289] fix errorCodes in fast tests --- tests/queries/0_stateless/00909_arrayEnumerateUniq.sql | 2 +- tests/queries/0_stateless/01045_array_zip.sql | 2 +- tests/queries/0_stateless/02354_parse_timedelta.sql | 4 ++-- tests/queries/0_stateless/02372_now_in_block.sql | 2 +- tests/queries/0_stateless/02718_array_fold.sql | 8 ++++---- 5 files changed, 9 insertions(+), 9 deletions(-) diff --git a/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql b/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql index 0bdb338e9d2..fe01b2185c2 100644 --- a/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql +++ b/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql @@ -152,7 +152,7 @@ DROP TABLE arrays_test; select '---------BAD'; -SELECT arrayEnumerateUniqRanked(); -- { serverError 42 } +SELECT arrayEnumerateUniqRanked(); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } SELECT arrayEnumerateUniqRanked([]); SELECT arrayEnumerateUniqRanked(1); -- { serverError 36 } SELECT arrayEnumerateUniqRanked(2,[]); -- { serverError 36 } diff --git a/tests/queries/0_stateless/01045_array_zip.sql b/tests/queries/0_stateless/01045_array_zip.sql index 1a85e6a0874..a2d54c8ae3f 100644 --- a/tests/queries/0_stateless/01045_array_zip.sql +++ b/tests/queries/0_stateless/01045_array_zip.sql @@ -2,7 +2,7 @@ SELECT arrayZip(['a', 'b', 'c'], ['d', 'e', 'f']); SELECT arrayZip(['a', 'b', 'c'], ['d', 'e', 'f'], ['g', 'h', 'i']); -SELECT arrayZip(); -- { serverError 42 } +SELECT arrayZip(); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } SELECT arrayZip('a', 'b', 'c'); -- { serverError 43 } diff --git a/tests/queries/0_stateless/02354_parse_timedelta.sql b/tests/queries/0_stateless/02354_parse_timedelta.sql index 29f2bf9fdfc..e876de64374 100644 --- a/tests/queries/0_stateless/02354_parse_timedelta.sql +++ b/tests/queries/0_stateless/02354_parse_timedelta.sql @@ -11,8 +11,8 @@ SELECT parseTimeDelta('1s - 1ms : 1μs ; 1ns'); SELECT parseTimeDelta('1.11s1.11ms1.11us1.11ns'); -- invalid expressions -SELECT parseTimeDelta(); -- {serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH} -SELECT parseTimeDelta('1yr', 1); -- {serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH} +SELECT parseTimeDelta(); -- {serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION} +SELECT parseTimeDelta('1yr', 1); -- {serverError TOO_MANY_ARGUMENTS_FOR_FUNCTION} SELECT parseTimeDelta(1); -- {serverError ILLEGAL_TYPE_OF_ARGUMENT} SELECT parseTimeDelta(' '); -- {serverError BAD_ARGUMENTS} SELECT parseTimeDelta('-1yr'); -- {serverError BAD_ARGUMENTS} diff --git a/tests/queries/0_stateless/02372_now_in_block.sql b/tests/queries/0_stateless/02372_now_in_block.sql index 7c884c0ba7d..815f74e5845 100644 --- a/tests/queries/0_stateless/02372_now_in_block.sql +++ b/tests/queries/0_stateless/02372_now_in_block.sql @@ -1,4 +1,4 @@ SELECT count() FROM (SELECT DISTINCT nowInBlock(), nowInBlock('Pacific/Pitcairn') FROM system.numbers LIMIT 2); SELECT nowInBlock(1); -- { serverError 43 } SELECT nowInBlock(NULL) IS NULL; -SELECT nowInBlock('UTC', 'UTC'); -- { serverError 42 } +SELECT nowInBlock('UTC', 'UTC'); -- { serverError TOO_MANY_ARGUMENTS_FOR_FUNCTION } diff --git 
a/tests/queries/0_stateless/02718_array_fold.sql b/tests/queries/0_stateless/02718_array_fold.sql index 7dee33c4705..73a3cebdda1 100644 --- a/tests/queries/0_stateless/02718_array_fold.sql +++ b/tests/queries/0_stateless/02718_array_fold.sql @@ -1,10 +1,10 @@ SELECT '-- Negative tests'; -SELECT arrayFold(); -- { serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH } -SELECT arrayFold(1); -- { serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH } -SELECT arrayFold(1, toUInt64(0)); -- { serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH } +SELECT arrayFold(); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } +SELECT arrayFold(1); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } +SELECT arrayFold(1, toUInt64(0)); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } SELECT arrayFold(1, emptyArrayUInt64(), toUInt64(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x -> x, emptyArrayString(), toInt8(0)); -- { serverError TYPE_MISMATCH } -SELECT arrayFold( acc,x -> x, 'not an array', toUInt8(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } +SELECT arrayFold( acc,x -> x, 'not an array', toUInt8(0)); -- { serverError I02718_array_foldLLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x,y -> x, [0, 1], 'not an array', toUInt8(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x -> x, [0, 1], [2, 3], toUInt8(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x,y -> x, [0, 1], [2, 3, 4], toUInt8(0)); -- { serverError SIZES_OF_ARRAYS_DONT_MATCH } From d3155707e9fdf56671af19dd38388861468378a1 Mon Sep 17 00:00:00 2001 From: vdimir Date: Mon, 6 May 2024 12:09:12 +0000 Subject: [PATCH 114/289] no filter pushdow for group_by_use_nulls --- src/Processors/QueryPlan/AggregatingStep.h | 1 + src/Processors/QueryPlan/Optimizations/filterPushDown.cpp | 3 +++ 2 files changed, 4 insertions(+) diff --git a/src/Processors/QueryPlan/AggregatingStep.h b/src/Processors/QueryPlan/AggregatingStep.h index f446ecec846..ae43295024a 100644 --- a/src/Processors/QueryPlan/AggregatingStep.h +++ b/src/Processors/QueryPlan/AggregatingStep.h @@ -59,6 +59,7 @@ public: const Aggregator::Params & getParams() const { return params; } const auto & getGroupingSetsParamsList() const { return grouping_sets_params; } + bool isGroupByUseNulls() const { return group_by_use_nulls; } bool inOrder() const { return !sort_description_for_merging.empty(); } bool explicitSortingRequired() const { return explicit_sorting_required_for_aggregation_in_order; } diff --git a/src/Processors/QueryPlan/Optimizations/filterPushDown.cpp b/src/Processors/QueryPlan/Optimizations/filterPushDown.cpp index 7dd526cbe95..5b3bcfc4468 100644 --- a/src/Processors/QueryPlan/Optimizations/filterPushDown.cpp +++ b/src/Processors/QueryPlan/Optimizations/filterPushDown.cpp @@ -428,6 +428,9 @@ size_t tryPushDownFilter(QueryPlan::Node * parent_node, QueryPlan::Nodes & nodes /// of the grouping sets, we could not push the filter down. if (aggregating->isGroupingSets()) { + /// Cannot push down filter if type has been changed. 
+ if (aggregating->isGroupByUseNulls()) + return 0; const auto & actions = filter->getExpression(); const auto & filter_node = actions->findInOutputs(filter->getFilterColumnName()); From fd75522ea8c8f5ccd0dd6251ea5bb5480823f9c4 Mon Sep 17 00:00:00 2001 From: vdimir Date: Mon, 6 May 2024 12:09:47 +0000 Subject: [PATCH 115/289] analyzer: fix select * with grouping sets --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 52efee03ae4..5fd49aa4541 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -4815,6 +4815,19 @@ ProjectionNames QueryAnalyzer::resolveMatcher(QueryTreeNodePtr & matcher_node, I } } + if (!scope.expressions_in_resolve_process_stack.hasAggregateFunction()) + { + for (auto & [node, _] : matched_expression_nodes_with_names) + { + auto it = scope.nullable_group_by_keys.find(node); + if (it != scope.nullable_group_by_keys.end()) + { + node = it->node->clone(); + node->convertToNullable(); + } + } + } + std::unordered_map> strict_transformer_to_used_column_names; for (const auto & transformer : matcher_node_typed.getColumnTransformers().getNodes()) { From 063db335480331bf0003f220ab74d93797a8ab17 Mon Sep 17 00:00:00 2001 From: vdimir Date: Mon, 6 May 2024 12:10:11 +0000 Subject: [PATCH 116/289] verbose error --- src/Functions/FunctionHelpers.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Functions/FunctionHelpers.cpp b/src/Functions/FunctionHelpers.cpp index ce83a489a3d..b31127d3896 100644 --- a/src/Functions/FunctionHelpers.cpp +++ b/src/Functions/FunctionHelpers.cpp @@ -80,7 +80,7 @@ ColumnWithTypeAndName columnGetNested(const ColumnWithTypeAndName & col) return ColumnWithTypeAndName{ nullable_res, nested_type, col.name }; } else - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column for DataTypeNullable"); + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} for DataTypeNullable", col.dumpStructure()); } return col; } From cf9bc27c0b80c17b887170c4182439de1c6e8643 Mon Sep 17 00:00:00 2001 From: vdimir Date: Mon, 6 May 2024 12:12:11 +0000 Subject: [PATCH 117/289] add test --- ...grouping_sets_use_nulls_pushdown.reference | 8 +++++ ...03150_grouping_sets_use_nulls_pushdown.sql | 29 +++++++++++++++++++ 2 files changed, 37 insertions(+) create mode 100644 tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference create mode 100644 tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql diff --git a/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference new file mode 100644 index 00000000000..e9f85e9052f --- /dev/null +++ b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference @@ -0,0 +1,8 @@ +2023-01-05 hello, world +2023-01-05 \N +2023-01-05 hello, world +2023-01-05 \N +2023-01-05 10 +2023-01-05 10 +2023-01-05 hello, world +2023-01-05 \N diff --git a/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql new file mode 100644 index 00000000000..0f057a1c99d --- /dev/null +++ b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql @@ -0,0 +1,29 @@ +DROP TABLE IF EXISTS test_grouping_sets_predicate; + +CREATE TABLE test_grouping_sets_predicate ( day_ Date, type_1 String ) ENGINE=MergeTree ORDER BY 
day_;
+
+INSERT INTO test_grouping_sets_predicate SELECT toDate('2023-01-05') AS day_, 'hello, world' FROM numbers (10);
+
+SET group_by_use_nulls = true;
+
+SELECT *
+FROM ( SELECT day_, type_1 FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) )
+WHERE day_ = '2023-01-05'
+ORDER BY ALL;
+
+
+SELECT *
+FROM ( SELECT * FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) )
+WHERE day_ = '2023-01-05'
+ORDER BY ALL;
+
+SELECT *
+FROM ( SELECT day_, COUNT(*) FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) )
+WHERE day_ = '2023-01-05'
+ORDER BY ALL;
+
+
+SELECT t2.*
+FROM ( SELECT t1.* FROM test_grouping_sets_predicate t1 GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) ) t2
+WHERE day_ = '2023-01-05'
+ORDER BY ALL;

From cad9c97725e4943730d0dabaa3df2cdf008be948 Mon Sep 17 00:00:00 2001
From: Maksim Kita
Date: Tue, 7 May 2024 17:21:25 +0300
Subject: [PATCH 118/289] Analyzer setting max_streams_to_max_threads_ratio overflow fix

---
 .../AggregateFunctionSparkbar.cpp                   |  4 ++--
 src/Planner/PlannerJoinTree.cpp                     | 10 +++++++++-
 ...streams_to_max_threads_ratio_overflow.reference  |  0
 ...g_max_streams_to_max_threads_ratio_overflow.sql  | 14 ++++++++++++++
 4 files changed, 25 insertions(+), 3 deletions(-)
 create mode 100644 tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.reference
 create mode 100644 tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.sql

diff --git a/src/AggregateFunctions/AggregateFunctionSparkbar.cpp b/src/AggregateFunctions/AggregateFunctionSparkbar.cpp
index b6e538520a8..362ffbe20d2 100644
--- a/src/AggregateFunctions/AggregateFunctionSparkbar.cpp
+++ b/src/AggregateFunctions/AggregateFunctionSparkbar.cpp
@@ -253,9 +253,9 @@ private:
         else
         {
             Y scaled;
-            bool has_overfllow = common::mulOverflow(y, levels_num, scaled);
+            bool has_overflow = common::mulOverflow(y, levels_num, scaled);
 
-            if (has_overfllow)
+            if (has_overflow)
                 y = y / (y_max / levels_num) + 1;
             else
                 y = scaled / y_max + 1;

diff --git a/src/Planner/PlannerJoinTree.cpp b/src/Planner/PlannerJoinTree.cpp
index 85cad1dcd69..094cf73dbc6 100644
--- a/src/Planner/PlannerJoinTree.cpp
+++ b/src/Planner/PlannerJoinTree.cpp
@@ -708,7 +708,15 @@ JoinTreeQueryPlan buildQueryPlanForTableExpression(QueryTreeNodePtr table_expres
 
     /// If necessary, we request more sources than the number of threads - to distribute the work evenly over the threads
     if (max_streams > 1 && !is_sync_remote)
-        max_streams = static_cast<size_t>(max_streams * settings.max_streams_to_max_threads_ratio);
+    {
+        if (auto streams_with_ratio = max_streams * settings.max_streams_to_max_threads_ratio; canConvertTo<size_t>(streams_with_ratio))
+            max_streams = static_cast<size_t>(streams_with_ratio);
+        else
+            throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND,
+                "Exceeded limit for `max_streams` with `max_streams_to_max_threads_ratio`. 
" + "Make sure that `max_streams * max_streams_to_max_threads_ratio` is in some reasonable boundaries, current value: {}", + streams_with_ratio); + } if (table_node) table_expression_query_info.table_expression_modifiers = table_node->getTableExpressionModifiers(); diff --git a/tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.reference b/tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.sql b/tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.sql new file mode 100644 index 00000000000..af326c15bd8 --- /dev/null +++ b/tests/queries/0_stateless/03148_setting_max_streams_to_max_threads_ratio_overflow.sql @@ -0,0 +1,14 @@ +DROP TABLE IF EXISTS test_table; +CREATE TABLE test_table +( + id UInt64, + value String +) ENGINE = MergeTree ORDER BY id; + +INSERT INTO test_table VALUES (0, 'Value_0'); + +SELECT * FROM test_table SETTINGS max_threads = 1025, max_streams_to_max_threads_ratio = -9223372036854775808, allow_experimental_analyzer = 1; -- { serverError PARAMETER_OUT_OF_BOUND } + +SELECT * FROM test_table SETTINGS max_threads = 1025, max_streams_to_max_threads_ratio = -9223372036854775808, allow_experimental_analyzer = 0; -- { serverError PARAMETER_OUT_OF_BOUND } + +DROP TABLE test_table; From c67a43e3a7354c3db488df44c05e5a0d56a454c5 Mon Sep 17 00:00:00 2001 From: vdimir Date: Tue, 7 May 2024 14:37:39 +0000 Subject: [PATCH 119/289] better --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 3 +++ src/Analyzer/ValidationUtils.cpp | 4 ++++ ..._grouping_sets_use_nulls_pushdown.reference | 6 ++++++ .../03150_grouping_sets_use_nulls_pushdown.sql | 18 ++++++++++++++++++ .../0_stateless/03151_where_asterisk.reference | 1 + .../0_stateless/03151_where_asterisk.sql | 3 +++ 6 files changed, 35 insertions(+) create mode 100644 tests/queries/0_stateless/03151_where_asterisk.reference create mode 100644 tests/queries/0_stateless/03151_where_asterisk.sql diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 5fd49aa4541..518c1272761 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -5021,7 +5021,10 @@ ProjectionNames QueryAnalyzer::resolveMatcher(QueryTreeNodePtr & matcher_node, I scope.scope_node->formatASTForErrorMessage()); } + auto original_ast = matcher_node->getOriginalAST(); matcher_node = std::move(list); + if (original_ast) + matcher_node->setOriginalAST(original_ast); return result_projection_names; } diff --git a/src/Analyzer/ValidationUtils.cpp b/src/Analyzer/ValidationUtils.cpp index 60cc1dd521f..45a916016ce 100644 --- a/src/Analyzer/ValidationUtils.cpp +++ b/src/Analyzer/ValidationUtils.cpp @@ -26,6 +26,10 @@ namespace void validateFilter(const QueryTreeNodePtr & filter_node, std::string_view exception_place_message, const QueryTreeNodePtr & query_node) { + if (filter_node->getNodeType() == QueryTreeNodeType::LIST) + throw Exception(ErrorCodes::BAD_ARGUMENTS, + "Unsupported expression '{}' in filter", filter_node->formatASTForErrorMessage()); + auto filter_node_result_type = filter_node->getResultType(); if (!filter_node_result_type->canBeUsedInBooleanContext()) throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_COLUMN_FOR_FILTER, diff --git a/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference 
b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference index e9f85e9052f..209c455b6f5 100644 --- a/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference +++ b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.reference @@ -2,6 +2,12 @@ 2023-01-05 \N 2023-01-05 hello, world 2023-01-05 \N +2023-01-05 +2023-01-05 +2023-01-05 hello, world +2023-01-05 \N +2023-01-05 hello, world +2023-01-05 \N 2023-01-05 10 2023-01-05 10 2023-01-05 hello, world diff --git a/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql index 0f057a1c99d..6162f55ac8f 100644 --- a/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql +++ b/tests/queries/0_stateless/03150_grouping_sets_use_nulls_pushdown.sql @@ -17,6 +17,24 @@ FROM ( SELECT * FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_ WHERE day_ = '2023-01-05' ORDER BY ALL; +SELECT * +FROM ( SELECT day_ FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) ) +WHERE day_ = '2023-01-05' +ORDER BY * +SETTINGS allow_experimental_analyzer=1; + +SELECT * +FROM ( SELECT * FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) ) +WHERE day_ = '2023-01-05' +GROUP BY * +SETTINGS allow_experimental_analyzer=1; + +SELECT * +FROM ( SELECT * FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (*), (day_) ) ) +WHERE day_ = '2023-01-05' +GROUP BY GROUPING SETS (*) +SETTINGS allow_experimental_analyzer=1; + SELECT * FROM ( SELECT day_, COUNT(*) FROM test_grouping_sets_predicate GROUP BY GROUPING SETS ( (day_, type_1), (day_) ) ) WHERE day_ = '2023-01-05' diff --git a/tests/queries/0_stateless/03151_where_asterisk.reference b/tests/queries/0_stateless/03151_where_asterisk.reference new file mode 100644 index 00000000000..8b137891791 --- /dev/null +++ b/tests/queries/0_stateless/03151_where_asterisk.reference @@ -0,0 +1 @@ + diff --git a/tests/queries/0_stateless/03151_where_asterisk.sql b/tests/queries/0_stateless/03151_where_asterisk.sql new file mode 100644 index 00000000000..4b01d6e165c --- /dev/null +++ b/tests/queries/0_stateless/03151_where_asterisk.sql @@ -0,0 +1,3 @@ +SET allow_experimental_analyzer = 1; + +SELECT * FROM (SELECT 1) t1 WHERE *; -- { serverError BAD_ARGUMENTS } From c45c1444355b740ed01fe1849f18f17c689d826b Mon Sep 17 00:00:00 2001 From: Yohann Jardin Date: Tue, 7 May 2024 16:39:43 +0200 Subject: [PATCH 120/289] fix typo in fast tests --- tests/queries/0_stateless/02718_array_fold.sql | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02718_array_fold.sql b/tests/queries/0_stateless/02718_array_fold.sql index 73a3cebdda1..e59eae87fdf 100644 --- a/tests/queries/0_stateless/02718_array_fold.sql +++ b/tests/queries/0_stateless/02718_array_fold.sql @@ -4,7 +4,7 @@ SELECT arrayFold(1); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } SELECT arrayFold(1, toUInt64(0)); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION } SELECT arrayFold(1, emptyArrayUInt64(), toUInt64(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x -> x, emptyArrayString(), toInt8(0)); -- { serverError TYPE_MISMATCH } -SELECT arrayFold( acc,x -> x, 'not an array', toUInt8(0)); -- { serverError I02718_array_foldLLEGAL_TYPE_OF_ARGUMENT } +SELECT arrayFold( acc,x -> x, 'not an array', toUInt8(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x,y -> x, [0, 1], 'not an array', 
toUInt8(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x -> x, [0, 1], [2, 3], toUInt8(0)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayFold( acc,x,y -> x, [0, 1], [2, 3, 4], toUInt8(0)); -- { serverError SIZES_OF_ARRAYS_DONT_MATCH } From 5117422c7bebd04e3511abff3b02fd26561cda13 Mon Sep 17 00:00:00 2001 From: yariks5s Date: Tue, 7 May 2024 14:48:50 +0000 Subject: [PATCH 121/289] init --- src/Core/Settings.h | 1 + src/Formats/FormatFactory.cpp | 1 + src/Formats/FormatSettings.h | 1 + .../Formats/Impl/PrettyBlockOutputFormat.cpp | 10 +++++----- .../Impl/PrettyCompactBlockOutputFormat.cpp | 4 ++-- .../Impl/PrettySpaceBlockOutputFormat.cpp | 4 ++-- .../03132_pretty_format_break_line.reference | 19 +++++++++++++++++++ .../03132_pretty_format_break_line.sql | 7 +++++++ 8 files changed, 38 insertions(+), 9 deletions(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index b4313d9af56..d640a556fb6 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -1113,6 +1113,7 @@ class IColumn; \ M(String, format_json_object_each_row_column_for_object_name, "", "The name of column that will be used as object names in JSONObjectEachRow format. Column type should be String", 0) \ \ + M(Bool, output_format_pretty_preserve_border_for_multiline_string, true, "Applies better rendering for multiline strings.", 0) \ M(UInt64, output_format_pretty_max_rows, 10000, "Rows limit for Pretty formats.", 0) \ M(UInt64, output_format_pretty_max_column_pad_width, 250, "Maximum width to pad all values in a column in Pretty formats.", 0) \ M(UInt64, output_format_pretty_max_value_width, 10000, "Maximum width of value to display in Pretty formats. If greater - it will be cut.", 0) \ diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index b7e9899da46..cca4c30f5e0 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -173,6 +173,7 @@ FormatSettings getFormatSettings(const ContextPtr & context, const Settings & se format_settings.pretty.max_value_width_apply_for_single_value = settings.output_format_pretty_max_value_width_apply_for_single_value; format_settings.pretty.highlight_digit_groups = settings.output_format_pretty_highlight_digit_groups; format_settings.pretty.output_format_pretty_row_numbers = settings.output_format_pretty_row_numbers; + format_settings.pretty.preserve_border_for_multiline_string = settings.output_format_pretty_preserve_border_for_multiline_string; format_settings.pretty.output_format_pretty_single_large_number_tip_threshold = settings.output_format_pretty_single_large_number_tip_threshold; format_settings.protobuf.input_flatten_google_wrappers = settings.input_format_protobuf_flatten_google_wrappers; format_settings.protobuf.output_nullables_with_google_wrappers = settings.output_format_protobuf_nullables_with_google_wrappers; diff --git a/src/Formats/FormatSettings.h b/src/Formats/FormatSettings.h index da225a39ec9..e320ea8e6b6 100644 --- a/src/Formats/FormatSettings.h +++ b/src/Formats/FormatSettings.h @@ -282,6 +282,7 @@ struct FormatSettings SettingFieldUInt64Auto color{"auto"}; bool output_format_pretty_row_numbers = false; + bool preserve_border_for_multiline_string = true; UInt64 output_format_pretty_single_large_number_tip_threshold = 1'000'000; enum class Charset diff --git a/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp index 178d0b912e1..e23622bc2e5 100644 --- a/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp +++ 
b/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp @@ -38,7 +38,7 @@ void PrettyBlockOutputFormat::calculateWidths( max_padded_widths.resize_fill(num_columns); name_widths.resize(num_columns); - const bool need_cut_to_width = format_settings.pretty.max_value_width_apply_for_single_value || num_rows != 1 || num_columns != 1 || total_rows != 0; + const bool need_cut_to_width = format_settings.pretty.preserve_border_for_multiline_string && (format_settings.pretty.max_value_width_apply_for_single_value || num_rows != 1 || num_columns != 1 || total_rows != 0); /// Calculate widths of all values. String serialized_value; @@ -333,7 +333,7 @@ void PrettyBlockOutputFormat::writeChunk(const Chunk & chunk, PortKind port_kind WriteBufferFromString out_serialize(serialized_value, AppendModeTag()); serializations[j]->serializeText(*columns[j], i, out_serialize, format_settings); } - if (cut_to_width) + if (cut_to_width && format_settings.pretty.preserve_border_for_multiline_string) splitValueAtBreakLine(serialized_value, transferred_row[j], cur_width); has_transferred_row |= !transferred_row[j].empty() && cur_width <= cut_to_width; @@ -345,7 +345,7 @@ void PrettyBlockOutputFormat::writeChunk(const Chunk & chunk, PortKind port_kind writeReadableNumberTip(chunk); writeCString("\n", out); - if (has_transferred_row) + if (has_transferred_row && format_settings.pretty.preserve_border_for_multiline_string) writeTransferredRow(max_widths, header, transferred_row, cut_to_width, false); } @@ -453,7 +453,7 @@ void PrettyBlockOutputFormat::writeValueWithPadding( value_width = format_settings.pretty.max_value_width; has_break_line = false; } - else if (!has_break_line) + else if (!has_break_line || !format_settings.pretty.preserve_border_for_multiline_string) value += ' '; auto write_padding = [&]() @@ -478,7 +478,7 @@ void PrettyBlockOutputFormat::writeValueWithPadding( write_padding(); } - if (has_break_line) + if (has_break_line && format_settings.pretty.preserve_border_for_multiline_string) writeString("…", out); } diff --git a/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp index 345b6c84ecd..1ccb6d713d7 100644 --- a/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp @@ -182,7 +182,7 @@ void PrettyCompactBlockOutputFormat::writeRow( WriteBufferFromString out_serialize(serialized_value, AppendModeTag()); serializations[j]->serializeText(*columns[j], row_num, out_serialize, format_settings); } - if (cut_to_width) + if (cut_to_width && format_settings.pretty.preserve_border_for_multiline_string) splitValueAtBreakLine(serialized_value, transferred_row[j], cur_width); has_transferred_row |= !transferred_row[j].empty() && cur_width <= cut_to_width; @@ -194,7 +194,7 @@ void PrettyCompactBlockOutputFormat::writeRow( writeReadableNumberTip(chunk); writeCString("\n", out); - if (has_transferred_row) + if (has_transferred_row && format_settings.pretty.preserve_border_for_multiline_string) writeTransferredRow(max_widths, header, transferred_row, cut_to_width, false); } diff --git a/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp index 6940c20e25b..0ed8c4398e4 100644 --- a/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp @@ -100,7 +100,7 @@ void PrettySpaceBlockOutputFormat::writeChunk(const Chunk & chunk, 
PortKind port WriteBufferFromString out_serialize(serialized_value, AppendModeTag()); serializations[column]->serializeText(*columns[column], row, out_serialize, format_settings); } - if (cut_to_width) + if (cut_to_width && format_settings.pretty.preserve_border_for_multiline_string) splitValueAtBreakLine(serialized_value, transferred_row[column], cur_width); has_transferred_row |= !transferred_row[column].empty() && cur_width <= cut_to_width; @@ -111,7 +111,7 @@ void PrettySpaceBlockOutputFormat::writeChunk(const Chunk & chunk, PortKind port writeReadableNumberTip(chunk); writeChar('\n', out); - if (has_transferred_row) + if (has_transferred_row && format_settings.pretty.preserve_border_for_multiline_string) writeTransferredRow(max_widths, header, transferred_row, cut_to_width, true); } diff --git a/tests/queries/0_stateless/03132_pretty_format_break_line.reference b/tests/queries/0_stateless/03132_pretty_format_break_line.reference index a5282f89327..b7b59df24fc 100644 --- a/tests/queries/0_stateless/03132_pretty_format_break_line.reference +++ b/tests/queries/0_stateless/03132_pretty_format_break_line.reference @@ -86,3 +86,22 @@ 2. │ 1 │ hello world │ hellow …│ │ │ │…мир │ └────┴─────────────┴─────────────┘ +┏━━━━┳━━━━━━━━━━━━━┳━━━━━━━━━━━━━┓ +┃ id ┃ value ┃ value1 ┃ +┡━━━━╇━━━━━━━━━━━━━╇━━━━━━━━━━━━━┩ +│ 0 │ привет +world │ hello world │ +├────┼─────────────┼─────────────┤ +│ 1 │ hello world │ hellow +мир │ +└────┴─────────────┴─────────────┘ + ┏━━━━┳━━━━━━━━━━━━━┳━━━━━━━━━━━━━┓ + ┃ id ┃ value ┃ value1 ┃ + ┡━━━━╇━━━━━━━━━━━━━╇━━━━━━━━━━━━━┩ +1. │ 0 │ привет +world │ hello world │ + ├────┼─────────────┼─────────────┤ +2. │ 1 │ hello world │ hellow +мир │ + └────┴─────────────┴─────────────┘ + \ No newline at end of file diff --git a/tests/queries/0_stateless/03132_pretty_format_break_line.sql b/tests/queries/0_stateless/03132_pretty_format_break_line.sql index ecf967c1836..5f002d8df67 100644 --- a/tests/queries/0_stateless/03132_pretty_format_break_line.sql +++ b/tests/queries/0_stateless/03132_pretty_format_break_line.sql @@ -1,5 +1,7 @@ DROP TABLE IF EXISTS t_break_line; +SET output_format_pretty_preserve_border_for_multiline_string=1; + CREATE TABLE t_break_line (id UInt64, value String, value1 String) ENGINE=MergeTree ORDER BY id; INSERT INTO t_break_line VALUES(0, 'hello\nworld', 'hello world'); @@ -30,4 +32,9 @@ INSERT INTO t_break_line VALUES(1, 'hello world', 'hellow\nмир'); SELECT * FROM t_break_line ORDER BY id FORMAT PrettyMonoBlock SETTINGS output_format_pretty_row_numbers = 0; SELECT * FROM t_break_line ORDER BY id FORMAT PrettyMonoBlock; +SET output_format_pretty_preserve_border_for_multiline_string=0; + +SELECT * FROM t_break_line ORDER BY id FORMAT PrettyMonoBlock SETTINGS output_format_pretty_row_numbers = 0; +SELECT * FROM t_break_line ORDER BY id FORMAT PrettyMonoBlock; + DROP TABLE t_break_line; \ No newline at end of file From ac485b612de0e7e79188fdb07cd63a3500f92132 Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Tue, 7 May 2024 17:11:37 +0200 Subject: [PATCH 122/289] add setting to SettingsChangesHistory --- src/Core/SettingsChangesHistory.h | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index cd1cd341c29..9a3ed14dd7c 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -91,6 +91,7 @@ static std::map sett {"cross_join_min_rows_to_compress", 0, 10000000, "A new setting."}, 
{"cross_join_min_bytes_to_compress", 0, 1_GiB, "A new setting."}, {"prefer_external_sort_block_bytes", 0, DEFAULT_BLOCK_SIZE * 256, "Prefer maximum block bytes for external sort, reduce the memory usage during merging."}, + {"output_format_pretty_preserve_border_for_multiline_string", 1, 1, "Applies better rendering for multiline strings."}, }}, {"24.4", {{"input_format_json_throw_on_bad_escape_sequence", true, true, "Allow to save JSON strings with bad escape sequences"}, {"max_parsing_threads", 0, 0, "Add a separate setting to control number of threads in parallel parsing from files"}, From 07472b3e95b8c0beceb8efc177872bb049faf6c6 Mon Sep 17 00:00:00 2001 From: Constantine Peresypkin Date: Wed, 10 Apr 2024 19:54:29 -0400 Subject: [PATCH 123/289] Add setting to force NULL for omitted fields Fixes #60884 --- src/Core/Settings.h | 1 + src/Core/SettingsChangesHistory.h | 1 + src/Formats/FormatFactory.cpp | 1 + src/Formats/FormatSettings.h | 1 + .../Impl/BSONEachRowRowInputFormat.cpp | 9 +++- .../Impl/JSONColumnsBlockInputFormatBase.cpp | 3 ++ .../Impl/JSONEachRowRowInputFormat.cpp | 10 ++++- .../Formats/Impl/TSKVRowInputFormat.cpp | 12 ++++- .../RowInputFormatWithNamesAndTypes.cpp | 20 +++++++++ .../03004_force_null_for_omitted.reference | 44 +++++++++++++++++++ .../03004_force_null_for_omitted.sql | 36 +++++++++++++++ 11 files changed, 135 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/03004_force_null_for_omitted.reference create mode 100644 tests/queries/0_stateless/03004_force_null_for_omitted.sql diff --git a/src/Core/Settings.h b/src/Core/Settings.h index b4313d9af56..f80bf1e4e3e 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -1006,6 +1006,7 @@ class IColumn; M(Bool, input_format_tsv_empty_as_default, false, "Treat empty fields in TSV input as default values.", 0) \ M(Bool, input_format_tsv_enum_as_number, false, "Treat inserted enum values in TSV formats as enum indices.", 0) \ M(Bool, input_format_null_as_default, true, "Initialize null fields with default values if the data type of this field is not nullable and it is supported by the input format", 0) \ + M(Bool, input_format_force_null_for_omitted_fields, false, "Force initialize omitted fields with null values", 0) \ M(Bool, input_format_arrow_case_insensitive_column_matching, false, "Ignore case when matching Arrow columns with CH columns.", 0) \ M(Int64, input_format_orc_row_batch_size, 100'000, "Batch size when reading ORC stripes.", 0) \ M(Bool, input_format_orc_case_insensitive_column_matching, false, "Ignore case when matching ORC columns with CH columns.", 0) \ diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index cd1cd341c29..5ea99aa0192 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -91,6 +91,7 @@ static std::map sett {"cross_join_min_rows_to_compress", 0, 10000000, "A new setting."}, {"cross_join_min_bytes_to_compress", 0, 1_GiB, "A new setting."}, {"prefer_external_sort_block_bytes", 0, DEFAULT_BLOCK_SIZE * 256, "Prefer maximum block bytes for external sort, reduce the memory usage during merging."}, + {"input_format_force_null_for_omitted_fields", false, false, "Disable type-defaults for omitted fields when needed"}, }}, {"24.4", {{"input_format_json_throw_on_bad_escape_sequence", true, true, "Allow to save JSON strings with bad escape sequences"}, {"max_parsing_threads", 0, 0, "Add a separate setting to control number of threads in parallel parsing from files"}, diff --git 
a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index b7e9899da46..3199445864d 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -146,6 +146,7 @@ FormatSettings getFormatSettings(const ContextPtr & context, const Settings & se format_settings.json.throw_on_bad_escape_sequence = settings.input_format_json_throw_on_bad_escape_sequence; format_settings.json.ignore_unnecessary_fields = settings.input_format_json_ignore_unnecessary_fields; format_settings.null_as_default = settings.input_format_null_as_default; + format_settings.force_null_for_omitted_fields = settings.input_format_force_null_for_omitted_fields; format_settings.decimal_trailing_zeros = settings.output_format_decimal_trailing_zeros; format_settings.parquet.row_group_rows = settings.output_format_parquet_row_group_size; format_settings.parquet.row_group_bytes = settings.output_format_parquet_row_group_size_bytes; diff --git a/src/Formats/FormatSettings.h b/src/Formats/FormatSettings.h index da225a39ec9..83b5c534297 100644 --- a/src/Formats/FormatSettings.h +++ b/src/Formats/FormatSettings.h @@ -32,6 +32,7 @@ struct FormatSettings bool write_statistics = true; bool import_nested_json = false; bool null_as_default = true; + bool force_null_for_omitted_fields = false; bool decimal_trailing_zeros = false; bool defaults_for_omitted_fields = true; bool is_writing_to_terminal = false; diff --git a/src/Processors/Formats/Impl/BSONEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/BSONEachRowRowInputFormat.cpp index 340bcc8aae5..6a3475a1830 100644 --- a/src/Processors/Formats/Impl/BSONEachRowRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/BSONEachRowRowInputFormat.cpp @@ -39,6 +39,7 @@ namespace ErrorCodes extern const int ILLEGAL_COLUMN; extern const int TOO_LARGE_STRING_SIZE; extern const int UNKNOWN_TYPE; + extern const int TYPE_MISMATCH; } namespace @@ -820,7 +821,13 @@ bool BSONEachRowRowInputFormat::readRow(MutableColumns & columns, RowReadExtensi /// Fill non-visited columns with the default values. 
for (size_t i = 0; i < num_columns; ++i) if (!seen_columns[i]) - header.getByPosition(i).type->insertDefaultInto(*columns[i]); + { + const auto & type = header.getByPosition(i).type; + if (format_settings.force_null_for_omitted_fields && !isNullableOrLowCardinalityNullable(type)) + throw Exception(ErrorCodes::TYPE_MISMATCH, "Cannot insert NULL value into a column of type '{}' at index {}", type->getName(), i); + else + type->insertDefaultInto(*columns[i]); + } if (format_settings.defaults_for_omitted_fields) ext.read_columns = read_columns; diff --git a/src/Processors/Formats/Impl/JSONColumnsBlockInputFormatBase.cpp b/src/Processors/Formats/Impl/JSONColumnsBlockInputFormatBase.cpp index faa4f36bbb0..e61e55efc8e 100644 --- a/src/Processors/Formats/Impl/JSONColumnsBlockInputFormatBase.cpp +++ b/src/Processors/Formats/Impl/JSONColumnsBlockInputFormatBase.cpp @@ -13,6 +13,7 @@ namespace ErrorCodes { extern const int INCORRECT_DATA; extern const int EMPTY_DATA_PASSED; + extern const int TYPE_MISMATCH; } @@ -194,6 +195,8 @@ Chunk JSONColumnsBlockInputFormatBase::read() { if (!seen_columns[i]) { + if (format_settings.force_null_for_omitted_fields && !isNullableOrLowCardinalityNullable(fields[i].type)) + throw Exception(ErrorCodes::TYPE_MISMATCH, "Cannot insert NULL value into a column `{}` of type '{}'", fields[i].name, fields[i].type->getName()); columns[i]->insertManyDefaults(rows); if (format_settings.defaults_for_omitted_fields) block_missing_values.setBits(i, rows); diff --git a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp index a78d8d016cd..8855a1bc28d 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowRowInputFormat.cpp @@ -18,6 +18,7 @@ namespace ErrorCodes extern const int INCORRECT_DATA; extern const int CANNOT_READ_ALL_DATA; extern const int LOGICAL_ERROR; + extern const int TYPE_MISMATCH; } namespace @@ -233,7 +234,14 @@ bool JSONEachRowRowInputFormat::readRow(MutableColumns & columns, RowReadExtensi /// Fill non-visited columns with the default values. for (size_t i = 0; i < num_columns; ++i) if (!seen_columns[i]) - header.getByPosition(i).type->insertDefaultInto(*columns[i]); + { + const auto & type = header.getByPosition(i).type; + if (format_settings.force_null_for_omitted_fields && !isNullableOrLowCardinalityNullable(type)) + throw Exception(ErrorCodes::TYPE_MISMATCH, "Cannot insert NULL value into a column `{}` of type '{}'", columnName(i), type->getName()); + else + type->insertDefaultInto(*columns[i]); + } + /// Return info about defaults set. /// If defaults_for_omitted_fields is set to 0, we should just leave already inserted defaults. diff --git a/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp b/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp index 29bc0012dc0..5382527fcdc 100644 --- a/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp @@ -15,6 +15,7 @@ namespace ErrorCodes extern const int CANNOT_PARSE_ESCAPE_SEQUENCE; extern const int CANNOT_READ_ALL_DATA; extern const int CANNOT_PARSE_INPUT_ASSERTION_FAILED; + extern const int TYPE_MISMATCH; } @@ -190,7 +191,16 @@ bool TSKVRowInputFormat::readRow(MutableColumns & columns, RowReadExtension & ex /// Fill in the not met columns with default values. 
for (size_t i = 0; i < num_columns; ++i) if (!seen_columns[i]) - header.getByPosition(i).type->insertDefaultInto(*columns[i]); + { + const auto & type = header.getByPosition(i).type; + if (format_settings.force_null_for_omitted_fields && !isNullableOrLowCardinalityNullable(type)) + throw Exception( + ErrorCodes::TYPE_MISMATCH, + "Cannot insert NULL value into a column `{}` of type '{}'", + header.getByPosition(i).name, + type->getName()); + type->insertDefaultInto(*columns[i]); + } /// return info about defaults set if (format_settings.defaults_for_omitted_fields) diff --git a/src/Processors/Formats/RowInputFormatWithNamesAndTypes.cpp b/src/Processors/Formats/RowInputFormatWithNamesAndTypes.cpp index 2ad6a825c8f..ae30d741c2f 100644 --- a/src/Processors/Formats/RowInputFormatWithNamesAndTypes.cpp +++ b/src/Processors/Formats/RowInputFormatWithNamesAndTypes.cpp @@ -18,6 +18,7 @@ namespace ErrorCodes { extern const int INCORRECT_DATA; extern const int LOGICAL_ERROR; + extern const int TYPE_MISMATCH; } namespace @@ -124,6 +125,17 @@ void RowInputFormatWithNamesAndTypes::readPrefix() } } } + + if (format_settings.force_null_for_omitted_fields) + { + for (auto index : column_mapping->not_presented_columns) + if (!isNullableOrLowCardinalityNullable(data_types[index])) + throw Exception( + ErrorCodes::TYPE_MISMATCH, + "Cannot insert NULL value into a column type '{}' at index {}", + data_types[index]->getName(), + index); + } } void RowInputFormatWithNamesAndTypes::tryDetectHeader(std::vector & column_names_out, std::vector & type_names_out) @@ -217,7 +229,15 @@ bool RowInputFormatWithNamesAndTypes::readRow(MutableColumns & columns, RowReadE { const auto & rem_column_index = column_mapping->column_indexes_for_input_fields[file_column]; if (rem_column_index) + { + if (format_settings.force_null_for_omitted_fields && !isNullableOrLowCardinalityNullable(data_types[*rem_column_index])) + throw Exception( + ErrorCodes::TYPE_MISMATCH, + "Cannot insert NULL value into a column type '{}' at index {}", + data_types[*rem_column_index]->getName(), + *rem_column_index); columns[*rem_column_index]->insertDefault(); + } ++file_column; } break; diff --git a/tests/queries/0_stateless/03004_force_null_for_omitted.reference b/tests/queries/0_stateless/03004_force_null_for_omitted.reference new file mode 100644 index 00000000000..a4c928aae8c --- /dev/null +++ b/tests/queries/0_stateless/03004_force_null_for_omitted.reference @@ -0,0 +1,44 @@ +0 0 +0 0 +2 0 +0 0 +4 0 +0 \N +0 \N +2 \N +0 \N +4 \N +0 \N +0 \N +2 \N +0 \N +4 \N +0 \N +0 \N +2 \N +0 \N +4 \N +0 \N +0 \N +2 \N +0 \N +4 \N +0 +0 \N +1 \N +1 \N +1 \N +1 \N +1 0 +1 \N +1 \N +1 2 +3 0 +1 0 +1 \N +1 \N +1 2 +3 0 +1 0 +1 \N +1 \N diff --git a/tests/queries/0_stateless/03004_force_null_for_omitted.sql b/tests/queries/0_stateless/03004_force_null_for_omitted.sql new file mode 100644 index 00000000000..43ba2568acb --- /dev/null +++ b/tests/queries/0_stateless/03004_force_null_for_omitted.sql @@ -0,0 +1,36 @@ +set allow_suspicious_low_cardinality_types = 1; +insert into function file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null Nullable(UInt32)') select number % 2 ? 
NULL : number from numbers(5) settings engine_file_truncate_on_insert=1; +select * from file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null UInt32, foo UInt32'); +select * from file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null UInt32, foo UInt32') settings input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } +select * from file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null UInt32, foo Nullable(UInt32)'); +select * from file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null UInt32, foo Nullable(UInt32)') settings input_format_force_null_for_omitted_fields = 1; +select * from file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null UInt32, foo LowCardinality(Nullable(UInt32))'); +select * from file(concat(currentDatabase(), '.03004_data.bsonEachRow'), auto, 'null UInt32, foo LowCardinality(Nullable(UInt32))') settings input_format_force_null_for_omitted_fields = 1; + +select * from format(JSONEachRow, 'foo UInt32', '{}'); +select * from format(JSONEachRow, 'foo UInt32', '{}') settings input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } +select * from format(JSONEachRow, 'foo UInt32, bar Nullable(UInt32)', '{}'); +select * from format(JSONEachRow, 'foo UInt32, bar Nullable(UInt32)', '{\"foo\":1}'); +select * from format(JSONEachRow, 'foo UInt32, bar Nullable(UInt32)', '{}') settings input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } +select * from format(JSONEachRow, 'foo UInt32, bar Nullable(UInt32)', '{\"foo\":1}') settings input_format_force_null_for_omitted_fields = 1; +select * from format(JSONEachRow, 'foo UInt32, bar LowCardinality(Nullable(UInt32))', '{\"foo\":1}'); +select * from format(JSONEachRow, 'foo UInt32, bar LowCardinality(Nullable(UInt32))', '{\"foo\":1}') settings input_format_force_null_for_omitted_fields = 1; + +select * from format(CSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo\nUInt32\n1'); +select * from format(CSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo\nUInt32\n1') settings input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } +select * from format(CSVWithNamesAndTypes, 'foo UInt32, bar Nullable(UInt32)', 'foo\nUInt32\n1') settings input_format_force_null_for_omitted_fields = 1; +select * from format(CSVWithNamesAndTypes, 'foo UInt32, bar LowCardinality(Nullable(UInt32))', 'foo\nUInt32\n1') settings input_format_force_null_for_omitted_fields = 1; +select * from format(CSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo,bar\nUInt32,UInt32\n1,2\n3\n') settings input_format_csv_allow_variable_number_of_columns = 1; +select * from format(CSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo,bar\nUInt32,UInt32\n1,2\n3\n') settings input_format_csv_allow_variable_number_of_columns = 1, input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } + +select * from format(TSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo\nUInt32\n1'); +select * from format(TSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo\nUInt32\n1') settings input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } +select * from format(TSVWithNamesAndTypes, 'foo UInt32, bar Nullable(UInt32)', 'foo\nUInt32\n1') settings input_format_force_null_for_omitted_fields = 1; +select * from format(TSVWithNamesAndTypes, 'foo UInt32, bar LowCardinality(Nullable(UInt32))', 'foo\nUInt32\n1') settings input_format_force_null_for_omitted_fields = 1; +select * 
from format(TSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo\tbar\nUInt32\tUInt32\n1\t2\n3\n') settings input_format_tsv_allow_variable_number_of_columns = 1; +select * from format(TSVWithNamesAndTypes, 'foo UInt32, bar UInt32', 'foo\tbar\nUInt32\tUInt32\n1\t2\n3\n') settings input_format_tsv_allow_variable_number_of_columns = 1, input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } + +select * from format(TSKV, 'foo UInt32, bar UInt32', 'foo=1\n'); +select * from format(TSKV, 'foo UInt32, bar UInt32', 'foo=1\n') settings input_format_force_null_for_omitted_fields = 1; -- { serverError TYPE_MISMATCH } +select * from format(TSKV, 'foo UInt32, bar Nullable(UInt32)', 'foo=1\n') settings input_format_force_null_for_omitted_fields = 1; +select * from format(TSKV, 'foo UInt32, bar LowCardinality(Nullable(UInt32))', 'foo=1\n') settings input_format_force_null_for_omitted_fields = 1; From b2377c3fefe8951158de201ea399485f6805f955 Mon Sep 17 00:00:00 2001 From: vdimir Date: Tue, 7 May 2024 15:31:35 +0000 Subject: [PATCH 124/289] Fix mysql dictionary source --- src/Dictionaries/ExternalQueryBuilder.cpp | 2 +- .../test_dictionaries_mysql/test.py | 38 ++++++++++++++++++- 2 files changed, 37 insertions(+), 3 deletions(-) diff --git a/src/Dictionaries/ExternalQueryBuilder.cpp b/src/Dictionaries/ExternalQueryBuilder.cpp index 792c4e3e907..a31301cd0f3 100644 --- a/src/Dictionaries/ExternalQueryBuilder.cpp +++ b/src/Dictionaries/ExternalQueryBuilder.cpp @@ -401,7 +401,7 @@ std::string ExternalQueryBuilder::composeLoadKeysQuery( { writeString("SELECT * FROM (", out); writeString(query, out); - writeString(") WHERE ", out); + writeString(") AS subquery WHERE ", out); composeKeysCondition(key_columns, requested_rows, method, partition_key_prefix, out); writeString(";", out); diff --git a/tests/integration/test_dictionaries_mysql/test.py b/tests/integration/test_dictionaries_mysql/test.py index 360456b2046..332f4ca11bb 100644 --- a/tests/integration/test_dictionaries_mysql/test.py +++ b/tests/integration/test_dictionaries_mysql/test.py @@ -76,7 +76,7 @@ def test_mysql_dictionaries_custom_query_full_load(started_cluster): query = instance.query query( - """ + f""" CREATE DICTIONARY test_dictionary_custom_query ( id UInt64, @@ -95,12 +95,46 @@ def test_mysql_dictionaries_custom_query_full_load(started_cluster): """ ) - result = query("SELECT id, value_1, value_2 FROM test_dictionary_custom_query") + result = query( + "SELECT dictGetString('test_dictionary_custom_query', 'value_1', toUInt64(1))" + ) + assert result == "Value_1\n" + result = query("SELECT id, value_1, value_2 FROM test_dictionary_custom_query") assert result == "1\tValue_1\tValue_2\n" query("DROP DICTIONARY test_dictionary_custom_query;") + query( + f""" + CREATE DICTIONARY test_cache_dictionary_custom_query + ( + id1 UInt64, + id2 UInt64, + value_concat String + ) + PRIMARY KEY id1, id2 + LAYOUT(COMPLEX_KEY_CACHE(SIZE_IN_CELLS 10)) + SOURCE(MYSQL( + HOST 'mysql80' + PORT 3306 + USER 'root' + PASSWORD 'clickhouse' + QUERY 'SELECT id AS id1, id + 1 AS id2, CONCAT_WS(" ", "The", value_1) AS value_concat FROM test.test_table_1')) + LIFETIME(0) + """ + ) + + result = query( + "SELECT dictGetString('test_cache_dictionary_custom_query', 'value_concat', (1, 2))" + ) + assert result == "The Value_1\n" + + result = query("SELECT id1, value_concat FROM test_cache_dictionary_custom_query") + assert result == "1\tThe Value_1\n" + + query("DROP DICTIONARY test_cache_dictionary_custom_query;") + 
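For context on the ExternalQueryBuilder change above: MySQL rejects a derived table that has no alias (error 1248, "Every derived table must have its own alias"), so the keys-lookup wrapper composed for a custom-query dictionary source has to name its subquery. A rough sketch of the composed SQL, where the inner query and the key condition are illustrative placeholders, not what the builder emits verbatim:

-- previously composed form; MySQL fails it with error 1248
SELECT * FROM (SELECT id, value_1 FROM test.test_table_1) WHERE id IN (1, 2);
-- form composed after this fix: the derived table is named
SELECT * FROM (SELECT id, value_1 FROM test.test_table_1) AS subquery WHERE id IN (1, 2);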
execute_mysql_query(mysql_connection, "DROP TABLE test.test_table_1;") execute_mysql_query(mysql_connection, "DROP TABLE test.test_table_2;") From 8e072f6b8d567ea82aa0c44bad6f26228b7bb96f Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Tue, 7 May 2024 18:58:51 +0200 Subject: [PATCH 125/289] Newline at the end of .reference --- .../queries/0_stateless/03132_pretty_format_break_line.reference | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/03132_pretty_format_break_line.reference b/tests/queries/0_stateless/03132_pretty_format_break_line.reference index b7b59df24fc..06b17ce4e12 100644 --- a/tests/queries/0_stateless/03132_pretty_format_break_line.reference +++ b/tests/queries/0_stateless/03132_pretty_format_break_line.reference @@ -104,4 +104,3 @@ world │ hello world │ 2. │ 1 │ hello world │ hellow мир │ └────┴─────────────┴─────────────┘ - \ No newline at end of file From 836cf150b5b4a9625aee0d440a0d64a966b4c4e0 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 7 May 2024 17:39:04 +0200 Subject: [PATCH 126/289] Fix --- src/Disks/StoragePolicy.cpp | 13 ++++++---- .../test_disk_over_web_server/test.py | 24 +++++++++++++++++++ 2 files changed, 32 insertions(+), 5 deletions(-) diff --git a/src/Disks/StoragePolicy.cpp b/src/Disks/StoragePolicy.cpp index 390afb368f8..ccdc34d5d06 100644 --- a/src/Disks/StoragePolicy.cpp +++ b/src/Disks/StoragePolicy.cpp @@ -462,15 +462,18 @@ StoragePolicySelectorPtr StoragePolicySelector::updateFromConfig(const Poco::Uti /// First pass, check. for (const auto & [name, policy] : policies) { - if (name.starts_with(TMP_STORAGE_POLICY_PREFIX)) - continue; + if (!name.starts_with(TMP_STORAGE_POLICY_PREFIX)) + { + if (!result->policies.contains(name)) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Storage policy {} is missing in new configuration", backQuote(name)); - if (!result->policies.contains(name)) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Storage policy {} is missing in new configuration", backQuote(name)); + policy->checkCompatibleWith(result->policies[name]); + } - policy->checkCompatibleWith(result->policies[name]); for (const auto & disk : policy->getDisks()) + { disks_before_reload.insert(disk->getName()); + } } /// Second pass, load. 
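The integration test below exercises the scenario this StoragePolicy change targets: a disk defined inline in a query registers a temporary storage policy (the TMP_STORAGE_POLICY_PREFIX kind whose compatibility check is skipped above), and its disks must still be collected into disks_before_reload so the second pass sees them on a config reload. A minimal sketch of the pattern, assuming a reachable web-disk endpoint; the table name and endpoint are illustrative:

-- an inline disk definition creates a temporary storage policy under the hood
CREATE TABLE web_backed (id Int32) ENGINE = MergeTree ORDER BY id
SETTINGS disk = disk(type = web, endpoint = 'http://nginx:80/test1/');
SYSTEM RELOAD CONFIG; -- must keep working while such a table exists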
diff --git a/tests/integration/test_disk_over_web_server/test.py b/tests/integration/test_disk_over_web_server/test.py index 8ddc1ff3c31..15b26c6b09e 100644 --- a/tests/integration/test_disk_over_web_server/test.py +++ b/tests/integration/test_disk_over_web_server/test.py @@ -40,6 +40,12 @@ def cluster(): image="clickhouse/clickhouse-server", tag=CLICKHOUSE_CI_MIN_TESTED_VERSION, ) + cluster.add_instance( + "node5", + main_configs=["configs/storage_conf.xml"], + with_nginx=True, + allow_analyzer=False, + ) cluster.start() @@ -390,3 +396,21 @@ def test_page_cache(cluster): node.query("DROP TABLE test{} SYNC".format(i)) print(f"Ok {i}") + + +def test_config_reload(cluster): + node1 = cluster.instances["node5"] + table_name = "config_reload" + + global uuids + node1.query( + f""" + DROP TABLE IF EXISTS {table_name}; + CREATE TABLE {table_name} UUID '{uuids[0]}' + (id Int32) ENGINE = MergeTree() ORDER BY id + SETTINGS disk = disk(type=web, endpoint='http://nginx:80/test1/'); + """ + ) + + node1.query("SYSTEM RELOAD CONFIG") + node1.query(f"DROP TABLE {table_name} SYNC") From 9ecbff2573adc3f335ba60c0a2e487a89339a852 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 7 May 2024 19:03:17 +0200 Subject: [PATCH 127/289] Update 03145_non_loaded_projection_backup.sh --- .../0_stateless/03145_non_loaded_projection_backup.sh | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh index 6f0e00ce3fc..b542c9fff9a 100755 --- a/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh +++ b/tests/queries/0_stateless/03145_non_loaded_projection_backup.sh @@ -36,6 +36,7 @@ backup table tp_1 to Disk('backups', '$backup_id'); " | grep -o "BACKUP_CREATED" $CLICKHOUSE_CLIENT -nm -q " +set send_logs_level='fatal'; drop table tp_1; restore table tp_1 from Disk('backups', '$backup_id'); " | grep -o "RESTORED" @@ -47,4 +48,6 @@ check table tp_1 settings check_query_single_value_result = 0;" | grep -o "Found $CLICKHOUSE_CLIENT -nm -q " set send_logs_level='fatal'; check table tp_1" -$CLICKHOUSE_CLIENT -q "drop table tp_1" +$CLICKHOUSE_CLIENT -nm -q " +set send_logs_level='fatal'; +drop table tp_1" From ed59a5c248e613aeab40f98dfedd2e9cd5c88dee Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Tue, 7 May 2024 19:17:00 +0200 Subject: [PATCH 128/289] Update PrettyBlockOutputFormat.cpp --- src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp index e23622bc2e5..d84ffe800e7 100644 --- a/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp @@ -345,7 +345,7 @@ void PrettyBlockOutputFormat::writeChunk(const Chunk & chunk, PortKind port_kind writeReadableNumberTip(chunk); writeCString("\n", out); - if (has_transferred_row && format_settings.pretty.preserve_border_for_multiline_string) + if (has_transferred_row) writeTransferredRow(max_widths, header, transferred_row, cut_to_width, false); } From cdcdb4cf71420aced463b01869da25be8015b75c Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Tue, 7 May 2024 19:35:09 +0200 Subject: [PATCH 129/289] remove unnecessary checks --- 
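A note on the setting the Pretty* checks below are simplified around: with output_format_pretty_preserve_border_for_multiline_string = 1, a value containing a line break keeps the table border and the cell continues on the next frame row, marked with "…"; with 0, the raw newline simply splits the frame, as the updated reference file shows. A sketch, with the abridged, approximate output implied rather than shown:

-- renders 'hello' and 'world' as one bordered cell spanning two frame rows
SELECT 'hello\nworld' AS s
FORMAT PrettyMonoBlock
SETTINGS output_format_pretty_preserve_border_for_multiline_string = 1;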
src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp | 4 ++-- .../Formats/Impl/PrettyCompactBlockOutputFormat.cpp | 2 +- src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp index d84ffe800e7..41c7bfa316b 100644 --- a/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/PrettyBlockOutputFormat.cpp @@ -453,7 +453,7 @@ void PrettyBlockOutputFormat::writeValueWithPadding( value_width = format_settings.pretty.max_value_width; has_break_line = false; } - else if (!has_break_line || !format_settings.pretty.preserve_border_for_multiline_string) + else if (!has_break_line) value += ' '; auto write_padding = [&]() @@ -478,7 +478,7 @@ void PrettyBlockOutputFormat::writeValueWithPadding( write_padding(); } - if (has_break_line && format_settings.pretty.preserve_border_for_multiline_string) + if (has_break_line) writeString("…", out); } diff --git a/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp index 1ccb6d713d7..ce22a3b2864 100644 --- a/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/PrettyCompactBlockOutputFormat.cpp @@ -194,7 +194,7 @@ void PrettyCompactBlockOutputFormat::writeRow( writeReadableNumberTip(chunk); writeCString("\n", out); - if (has_transferred_row && format_settings.pretty.preserve_border_for_multiline_string) + if (has_transferred_row) writeTransferredRow(max_widths, header, transferred_row, cut_to_width, false); } diff --git a/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp b/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp index 0ed8c4398e4..d311f005173 100644 --- a/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/PrettySpaceBlockOutputFormat.cpp @@ -111,7 +111,7 @@ void PrettySpaceBlockOutputFormat::writeChunk(const Chunk & chunk, PortKind port writeReadableNumberTip(chunk); writeChar('\n', out); - if (has_transferred_row && format_settings.pretty.preserve_border_for_multiline_string) + if (has_transferred_row) writeTransferredRow(max_widths, header, transferred_row, cut_to_width, true); } From a2e9b6f4c61de96a12edee926c757c3d776d01a7 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Tue, 7 May 2024 17:42:43 +0000 Subject: [PATCH 130/289] Another attempt. 
--- src/Planner/PlannerExpressionAnalysis.cpp | 49 ++++++++++++++++++++--- 1 file changed, 43 insertions(+), 6 deletions(-) diff --git a/src/Planner/PlannerExpressionAnalysis.cpp b/src/Planner/PlannerExpressionAnalysis.cpp index d7fa270a643..6e194b2c03e 100644 --- a/src/Planner/PlannerExpressionAnalysis.cpp +++ b/src/Planner/PlannerExpressionAnalysis.cpp @@ -51,6 +51,41 @@ FilterAnalysisResult analyzeFilter(const QueryTreeNodePtr & filter_expression_no return result; } +bool isDeterministicConstant(const ConstantNode & root) +{ + const auto & source_expression = root.getSourceExpression(); + if (!source_expression) + return true; + + std::stack nodes; + nodes.push(source_expression.get()); + while (!nodes.empty()) + { + const auto * node = nodes.top(); + nodes.pop(); + + const auto * constant_node = node->as(); + const auto * function_node = node->as(); + if (constant_node) + { + if (!isDeterministicConstant(*constant_node)) + return false; + } + else if (function_node) + { + if (!function_node->getFunctionOrThrow()->isDeterministic()) + return false; + + for (const auto & child : function_node->getArguments()) + nodes.push(child.get()); + } + else + return false; + } + + return true; +} + /** Construct aggregation analysis result if query tree has GROUP BY or aggregates. * Actions before aggregation are added into actions chain, if result is not null optional. */ @@ -86,6 +121,8 @@ std::optional analyzeAggregation(const QueryTreeNodeP (query_node.isGroupByWithGroupingSets() || query_node.isGroupByWithRollup() || query_node.isGroupByWithCube()); bool is_secondary_query = planner_context->getQueryContext()->getClientInfo().query_kind == ClientInfo::QueryKind::SECONDARY_QUERY; + bool is_distributed_query = planner_context->getQueryContext()->isDistributed(); + bool check_deterministic_constants = is_secondary_query || is_distributed_query; if (query_node.hasGroupBy()) { @@ -99,10 +136,10 @@ std::optional analyzeAggregation(const QueryTreeNodeP for (auto & grouping_set_key_node : grouping_set_keys_list_node_typed.getNodes()) { - auto is_constant_key = grouping_set_key_node->as() != nullptr; - group_by_with_constant_keys |= is_constant_key; + const auto * constant_key = grouping_set_key_node->as(); + group_by_with_constant_keys |= (constant_key != nullptr); - if (!is_secondary_query && is_constant_key && !aggregates_descriptions.empty()) + if (constant_key && !aggregates_descriptions.empty() && (!check_deterministic_constants || isDeterministicConstant(*constant_key))) continue; auto expression_dag_nodes = actions_visitor.visit(before_aggregation_actions, grouping_set_key_node); @@ -151,10 +188,10 @@ std::optional analyzeAggregation(const QueryTreeNodeP { for (auto & group_by_key_node : query_node.getGroupBy().getNodes()) { - auto is_constant_key = group_by_key_node->as() != nullptr; - group_by_with_constant_keys |= is_constant_key; + const auto * constant_key = group_by_key_node->as(); + group_by_with_constant_keys |= (constant_key != nullptr); - if (!is_secondary_query && is_constant_key && !aggregates_descriptions.empty()) + if (constant_key && !aggregates_descriptions.empty() && (!check_deterministic_constants || isDeterministicConstant(*constant_key))) continue; auto expression_dag_nodes = actions_visitor.visit(before_aggregation_actions, group_by_key_node); From 511146c99c7d0c92802052643ae71e6f3f4c6dad Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi <114298166+yariks5s@users.noreply.github.com> Date: Tue, 7 May 2024 19:51:47 +0200 Subject: [PATCH 131/289] Update CHANGELOG.md --- 
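One step back to the isDeterministicConstant change in the preceding patch: a GROUP BY key folded to a constant may only be elided on secondary or distributed queries when every function feeding it is deterministic, since otherwise the initiator and the shards could fold different values. An illustration under that reading, where the hosts are placeholders and randConstant() stands in for any non-deterministic source (it is constant within one query but varies between queries):

-- the constant-folded key must stay in the aggregation on each shard
SELECT count()
FROM remote('127.0.0.{1,2}', system.one)
GROUP BY randConstant() + 1;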
CHANGELOG.md | 1 - 1 file changed, 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 955e2f5b72f..f40c42c4462 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -33,7 +33,6 @@ * A mode for `topK`/`topkWeighed` support mode, which return count of values and its error. [#54508](https://github.com/ClickHouse/ClickHouse/pull/54508) ([UnamedRus](https://github.com/UnamedRus)). * Added function `toMillisecond` which returns the millisecond component for values of type`DateTime` or `DateTime64`. [#60281](https://github.com/ClickHouse/ClickHouse/pull/60281) ([Shaun Struwig](https://github.com/Blargian)). * Allow configuring HTTP redirect handlers for clickhouse-server. For example, you can make `/` redirect to the Play UI. [#60390](https://github.com/ClickHouse/ClickHouse/pull/60390) ([Alexey Milovidov](https://github.com/alexey-milovidov)). -* Allow Raw as a synonym for TSVRaw. [#63394](https://github.com/ClickHouse/ClickHouse/pull/63394) ([Unalian](https://github.com/Unalian)) #### Performance Improvement * Optimized function `dotProduct` to omit unnecessary and expensive memory copies. [#60928](https://github.com/ClickHouse/ClickHouse/pull/60928) ([Robert Schulze](https://github.com/rschu1ze)). From f52dfd98aa0ff7d1c037da02fdf2cf402e7ad3a6 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 7 May 2024 16:31:21 +0000 Subject: [PATCH 132/289] add test for 49307 --- .../03148_mutations_virtual_columns.reference | 1 + .../03148_mutations_virtual_columns.sql | 16 ++++++++++++++++ 2 files changed, 17 insertions(+) create mode 100644 tests/queries/0_stateless/03148_mutations_virtual_columns.reference create mode 100644 tests/queries/0_stateless/03148_mutations_virtual_columns.sql diff --git a/tests/queries/0_stateless/03148_mutations_virtual_columns.reference b/tests/queries/0_stateless/03148_mutations_virtual_columns.reference new file mode 100644 index 00000000000..7c5e8041147 --- /dev/null +++ b/tests/queries/0_stateless/03148_mutations_virtual_columns.reference @@ -0,0 +1 @@ +2 all_2_2_0 diff --git a/tests/queries/0_stateless/03148_mutations_virtual_columns.sql b/tests/queries/0_stateless/03148_mutations_virtual_columns.sql new file mode 100644 index 00000000000..045869b224a --- /dev/null +++ b/tests/queries/0_stateless/03148_mutations_virtual_columns.sql @@ -0,0 +1,16 @@ +DROP TABLE IF EXISTS t_mut_virtuals; + +CREATE TABLE t_mut_virtuals (id UInt64, s String) ENGINE = MergeTree ORDER BY id; + +INSERT INTO t_mut_virtuals VALUES (1, 'a'); +INSERT INTO t_mut_virtuals VALUES (2, 'b'); + +SET insert_keeper_fault_injection_probability = 0; +SET mutations_sync = 2; + +ALTER TABLE t_mut_virtuals UPDATE s = _part WHERE 1; +ALTER TABLE t_mut_virtuals DELETE WHERE _part LIKE 'all_1_1_0%'; + +SELECT * FROM t_mut_virtuals ORDER BY id; + +DROP TABLE t_mut_virtuals; From 134b468d917fd8b243b5b39e15872057acbc3015 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Tue, 7 May 2024 18:14:32 +0000 Subject: [PATCH 133/289] Another case. 
--- src/Analyzer/Passes/QueryAnalysisPass.cpp | 14 +++++++++----- ...3_group_by_use_nulls_analyzer_crashes.reference | 10 ++++++++++ .../03023_group_by_use_nulls_analyzer_crashes.sql | 2 ++ 3 files changed, 21 insertions(+), 5 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 80294b7a428..426f3b6bde8 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -4120,8 +4120,8 @@ IdentifierResolveResult QueryAnalyzer::tryResolveIdentifier(const IdentifierLook * SELECT id FROM ( SELECT ... ) AS subquery ARRAY JOIN [0] AS id INNER JOIN second_table USING (id) * In the example, identifier `id` should be resolved into one from USING (id) column. */ - auto alias_it = scope.alias_name_to_expression_node.find(identifier_lookup.identifier.getFullName()); - if (alias_it != scope.alias_name_to_expression_node.end() && alias_it->second->getNodeType() == QueryTreeNodeType::COLUMN) + auto alias_it = scope.alias_name_to_expression_node->find(identifier_lookup.identifier.getFullName()); + if (alias_it != scope.alias_name_to_expression_node->end() && alias_it->second->getNodeType() == QueryTreeNodeType::COLUMN) { const auto & column_node = alias_it->second->as(); if (column_node.getColumnSource()->getNodeType() == QueryTreeNodeType::ARRAY_JOIN) @@ -5225,8 +5225,12 @@ ProjectionNames QueryAnalyzer::resolveLambda(const QueryTreeNodePtr & lambda_nod for (size_t i = 0; i < lambda_arguments_nodes_size; ++i) { auto & lambda_argument_node = lambda_arguments_nodes[i]; - auto & lambda_argument_node_typed = lambda_argument_node->as(); - const auto & lambda_argument_name = lambda_argument_node_typed.getIdentifier().getFullName(); + const auto * lambda_argument_identifier = lambda_argument_node->as(); + const auto * lambda_argument_column = lambda_argument_node->as(); + if (!lambda_argument_identifier && !lambda_argument_column) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Expected IDENTIFIER or COLUMN as lambda argument, got {}", lambda_node->dumpTree()); + const auto & lambda_argument_name = lambda_argument_identifier ? lambda_argument_identifier->getIdentifier().getFullName() + : lambda_argument_column->getColumnName(); bool has_expression_node = scope.alias_name_to_expression_node->contains(lambda_argument_name); bool has_alias_node = scope.alias_name_to_lambda_node.contains(lambda_argument_name); @@ -5236,7 +5240,7 @@ ProjectionNames QueryAnalyzer::resolveLambda(const QueryTreeNodePtr & lambda_nod throw Exception(ErrorCodes::BAD_ARGUMENTS, "Alias name '{}' inside lambda {} cannot have same name as lambda argument. 
In scope {}", lambda_argument_name, - lambda_argument_node_typed.formatASTForErrorMessage(), + lambda_argument_node->formatASTForErrorMessage(), scope.scope_node->formatASTForErrorMessage()); } diff --git a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference index 0eb9d94e85a..273e1567a9b 100644 --- a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference +++ b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.reference @@ -86,3 +86,13 @@ a a \N 0 nan \N 4 nan \N \N nan +[] +['.'] +['.','.'] +['.','.','.'] +['.','.','.','.'] +['.','.','.','.','.'] +['.','.','.','.','.','.'] +['.','.','.','.','.','.','.'] +['.','.','.','.','.','.','.','.'] +['.','.','.','.','.','.','.','.','.'] diff --git a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql index 7311ce54e39..bba0a27560f 100644 --- a/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql +++ b/tests/queries/0_stateless/03023_group_by_use_nulls_analyzer_crashes.sql @@ -43,3 +43,5 @@ GROUP BY number + number AS b WITH CUBE SETTINGS group_by_use_nulls = 1; + +SELECT arrayMap(x -> '.', range(number % 10)) AS k FROM remote('127.0.0.{2,3}', numbers(10)) GROUP BY GROUPING SETS ((k)) ORDER BY k settings group_by_use_nulls=1; From 95b76bf6a47f0e23d41ce33c2223cee93066ad3e Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Tue, 7 May 2024 20:58:19 +0200 Subject: [PATCH 134/289] Remove leftovers of GCC support in cmake rules Signed-off-by: Azat Khuzhin --- CMakeLists.txt | 119 +++++++++------------ cmake/linux/default_libs.cmake | 16 ++- cmake/sanitize.cmake | 8 +- cmake/tools.cmake | 85 +++++---------- cmake/warnings.cmake | 66 ++++++------ contrib/capnproto-cmake/CMakeLists.txt | 4 +- contrib/openssl-cmake/CMakeLists.txt | 10 +- contrib/sentry-native-cmake/CMakeLists.txt | 2 +- 8 files changed, 125 insertions(+), 185 deletions(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index be804a14765..abbc48ab23a 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -135,23 +135,21 @@ endif () include (cmake/check_flags.cmake) include (cmake/add_warning.cmake) -if (COMPILER_CLANG) - # generate ranges for fast "addr2line" search - if (NOT CMAKE_BUILD_TYPE_UC STREQUAL "RELEASE") - # NOTE: that clang has a bug because of it does not emit .debug_aranges - # with ThinLTO, so custom ld.lld wrapper is shipped in docker images. - set(COMPILER_FLAGS "${COMPILER_FLAGS} -gdwarf-aranges") - endif () - - # See https://blog.llvm.org/posts/2021-04-05-constructor-homing-for-debug-info/ - if (CMAKE_BUILD_TYPE_UC STREQUAL "DEBUG" OR CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO") - set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Xclang -fuse-ctor-homing") - set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -Xclang -fuse-ctor-homing") - endif() - - no_warning(enum-constexpr-conversion) # breaks Protobuf in clang-16 +# generate ranges for fast "addr2line" search +if (NOT CMAKE_BUILD_TYPE_UC STREQUAL "RELEASE") + # NOTE: that clang has a bug because of it does not emit .debug_aranges + # with ThinLTO, so custom ld.lld wrapper is shipped in docker images. 
+ set(COMPILER_FLAGS "${COMPILER_FLAGS} -gdwarf-aranges") endif () +# See https://blog.llvm.org/posts/2021-04-05-constructor-homing-for-debug-info/ +if (CMAKE_BUILD_TYPE_UC STREQUAL "DEBUG" OR CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO") + set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Xclang -fuse-ctor-homing") + set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -Xclang -fuse-ctor-homing") +endif() + +no_warning(enum-constexpr-conversion) # breaks Protobuf in clang-16 + option(ENABLE_TESTS "Provide unit_test_dbms target with Google.Test unit tests" ON) option(ENABLE_EXAMPLES "Build all example programs in 'examples' subdirectories" OFF) option(ENABLE_BENCHMARKS "Build all benchmark programs in 'benchmarks' subdirectories" OFF) @@ -284,16 +282,12 @@ endif () option (ENABLE_BUILD_PROFILING "Enable profiling of build time" OFF) if (ENABLE_BUILD_PROFILING) - if (COMPILER_CLANG) - set (COMPILER_FLAGS "${COMPILER_FLAGS} -ftime-trace") + set (COMPILER_FLAGS "${COMPILER_FLAGS} -ftime-trace") - if (LINKER_NAME MATCHES "lld") - set (CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -Wl,--time-trace") - set (CMAKE_MODULE_LINKER_FLAGS "${CMAKE_MODULE_LINKER_FLAGS} -Wl,--time-trace") - endif () - else () - message (${RECONFIGURE_MESSAGE_LEVEL} "Build profiling is only available with CLang") - endif () + if (LINKER_NAME MATCHES "lld") + set (CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -Wl,--time-trace") + set (CMAKE_MODULE_LINKER_FLAGS "${CMAKE_MODULE_LINKER_FLAGS} -Wl,--time-trace") + endif () endif () set (CMAKE_CXX_STANDARD 23) @@ -304,22 +298,20 @@ set (CMAKE_C_STANDARD 11) set (CMAKE_C_EXTENSIONS ON) # required by most contribs written in C set (CMAKE_C_STANDARD_REQUIRED ON) -if (COMPILER_CLANG) - # Enable C++14 sized global deallocation functions. It should be enabled by setting -std=c++14 but I'm not sure. - # See https://reviews.llvm.org/D112921 - set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsized-deallocation") +# Enable C++14 sized global deallocation functions. It should be enabled by setting -std=c++14 but I'm not sure. +# See https://reviews.llvm.org/D112921 +set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsized-deallocation") - # falign-functions=32 prevents from random performance regressions with the code change. Thus, providing more stable - # benchmarks. - set(COMPILER_FLAGS "${COMPILER_FLAGS} -falign-functions=32") +# falign-functions=32 prevents from random performance regressions with the code change. Thus, providing more stable +# benchmarks. +set(COMPILER_FLAGS "${COMPILER_FLAGS} -falign-functions=32") - if (ARCH_AMD64) - # align branches within a 32-Byte boundary to avoid the potential performance loss when code layout change, - # which makes benchmark results more stable. - set(BRANCHES_WITHIN_32B_BOUNDARIES "-mbranches-within-32B-boundaries") - set(COMPILER_FLAGS "${COMPILER_FLAGS} ${BRANCHES_WITHIN_32B_BOUNDARIES}") - endif() -endif () +if (ARCH_AMD64) + # align branches within a 32-Byte boundary to avoid the potential performance loss when code layout change, + # which makes benchmark results more stable. 
diff --git a/cmake/linux/default_libs.cmake b/cmake/linux/default_libs.cmake
index e5ca8e296fc..4a06243243e 100644
--- a/cmake/linux/default_libs.cmake
+++ b/cmake/linux/default_libs.cmake
@@ -5,17 +5,15 @@ set (DEFAULT_LIBS "-nodefaultlibs")

 # We need builtins from Clang's RT even without libcxx - for ubsan+int128.
 # See https://bugs.llvm.org/show_bug.cgi?id=16404
-if (COMPILER_CLANG)
-    execute_process (COMMAND ${CMAKE_CXX_COMPILER} --target=${CMAKE_CXX_COMPILER_TARGET} --print-libgcc-file-name --rtlib=compiler-rt OUTPUT_VARIABLE BUILTINS_LIBRARY OUTPUT_STRIP_TRAILING_WHITESPACE)
+execute_process (COMMAND ${CMAKE_CXX_COMPILER} --target=${CMAKE_CXX_COMPILER_TARGET} --print-libgcc-file-name --rtlib=compiler-rt OUTPUT_VARIABLE BUILTINS_LIBRARY OUTPUT_STRIP_TRAILING_WHITESPACE)

-    # Apparently, in clang-19, the UBSan support library for C++ was moved out into ubsan_standalone_cxx.a, so we have to include both.
-    if (SANITIZE STREQUAL undefined)
-        string(REPLACE "builtins.a" "ubsan_standalone_cxx.a" EXTRA_BUILTINS_LIBRARY "${BUILTINS_LIBRARY}")
-    endif ()
+# Apparently, in clang-19, the UBSan support library for C++ was moved out into ubsan_standalone_cxx.a, so we have to include both.
+if (SANITIZE STREQUAL undefined)
+    string(REPLACE "builtins.a" "ubsan_standalone_cxx.a" EXTRA_BUILTINS_LIBRARY "${BUILTINS_LIBRARY}")
+endif ()

-    if (NOT EXISTS "${BUILTINS_LIBRARY}")
-        set (BUILTINS_LIBRARY "-lgcc")
-    endif ()
+if (NOT EXISTS "${BUILTINS_LIBRARY}")
+    set (BUILTINS_LIBRARY "-lgcc")
 endif ()

 if (OS_ANDROID)
diff --git a/cmake/sanitize.cmake b/cmake/sanitize.cmake
index a3523203912..08716c1196b 100644
--- a/cmake/sanitize.cmake
+++ b/cmake/sanitize.cmake
@@ -26,9 +26,7 @@ if (SANITIZE)
     elseif (SANITIZE STREQUAL "thread")
         set (TSAN_FLAGS "-fsanitize=thread")
-        if (COMPILER_CLANG)
-            set (TSAN_FLAGS "${TSAN_FLAGS} -fsanitize-ignorelist=${PROJECT_SOURCE_DIR}/tests/tsan_ignorelist.txt")
-        endif()
+        set (TSAN_FLAGS "${TSAN_FLAGS} -fsanitize-ignorelist=${PROJECT_SOURCE_DIR}/tests/tsan_ignorelist.txt")

         set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${SAN_FLAGS} ${TSAN_FLAGS}")
         set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${SAN_FLAGS} ${TSAN_FLAGS}")
@@ -44,9 +42,7 @@ if (SANITIZE)
             # that's why we often receive reports about UIO. The simplest way to avoid this is just set this flag here.
             set(UBSAN_FLAGS "${UBSAN_FLAGS} -fno-sanitize=unsigned-integer-overflow")
         endif()
-        if (COMPILER_CLANG)
-            set (UBSAN_FLAGS "${UBSAN_FLAGS} -fsanitize-ignorelist=${PROJECT_SOURCE_DIR}/tests/ubsan_ignorelist.txt")
-        endif()
+        set (UBSAN_FLAGS "${UBSAN_FLAGS} -fsanitize-ignorelist=${PROJECT_SOURCE_DIR}/tests/ubsan_ignorelist.txt")

         set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${SAN_FLAGS} ${UBSAN_FLAGS}")
         set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${SAN_FLAGS} ${UBSAN_FLAGS}")
diff --git a/cmake/tools.cmake b/cmake/tools.cmake
index 1ba3007b0f3..024505411a3 100644
--- a/cmake/tools.cmake
+++ b/cmake/tools.cmake
@@ -1,10 +1,6 @@
 # Compiler

-if (CMAKE_CXX_COMPILER_ID MATCHES "AppleClang")
-    set (COMPILER_CLANG 1) # Safe to treat AppleClang as a regular Clang, in general.
-elseif (CMAKE_CXX_COMPILER_ID MATCHES "Clang")
-    set (COMPILER_CLANG 1)
-else ()
+if (NOT CMAKE_CXX_COMPILER_ID MATCHES "Clang")
     message (FATAL_ERROR "Compiler ${CMAKE_CXX_COMPILER_ID} is not supported")
 endif ()

@@ -17,30 +13,26 @@ set (CLANG_MINIMUM_VERSION 16)
 set (XCODE_MINIMUM_VERSION 12.0)
 set (APPLE_CLANG_MINIMUM_VERSION 12.0.0)

-if (COMPILER_CLANG)
-    if (CMAKE_CXX_COMPILER_ID MATCHES "AppleClang")
-        # (Experimental!) Specify "-DALLOW_APPLECLANG=ON" when running CMake configuration step, if you want to experiment with using it.
-        if (NOT ALLOW_APPLECLANG AND NOT DEFINED ENV{ALLOW_APPLECLANG})
-            message (FATAL_ERROR "Compilation with AppleClang is unsupported. Please use vanilla Clang, e.g. from Homebrew.")
-        endif ()
+if (CMAKE_CXX_COMPILER_ID MATCHES "AppleClang")
+    # (Experimental!) Specify "-DALLOW_APPLECLANG=ON" when running CMake configuration step, if you want to experiment with using it.
+    if (NOT ALLOW_APPLECLANG AND NOT DEFINED ENV{ALLOW_APPLECLANG})
+        message (FATAL_ERROR "Compilation with AppleClang is unsupported. Please use vanilla Clang, e.g. from Homebrew.")
+    endif ()

-        # For a mapping between XCode / AppleClang / vanilla Clang versions, see https://en.wikipedia.org/wiki/Xcode
-        if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${APPLE_CLANG_MINIMUM_VERSION})
-            message (FATAL_ERROR "Compilation with AppleClang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${APPLE_CLANG_MINIMUM_VERSION} (Xcode ${XCODE_MINIMUM_VERSION}).")
-        endif ()
-    else ()
-        if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${CLANG_MINIMUM_VERSION})
-            message (FATAL_ERROR "Compilation with Clang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${CLANG_MINIMUM_VERSION}.")
-        endif ()
+    # For a mapping between XCode / AppleClang / vanilla Clang versions, see https://en.wikipedia.org/wiki/Xcode
+    if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${APPLE_CLANG_MINIMUM_VERSION})
+        message (FATAL_ERROR "Compilation with AppleClang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${APPLE_CLANG_MINIMUM_VERSION} (Xcode ${XCODE_MINIMUM_VERSION}).")
+    endif ()
+else ()
+    if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${CLANG_MINIMUM_VERSION})
+        message (FATAL_ERROR "Compilation with Clang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${CLANG_MINIMUM_VERSION}.")
     endif ()
 endif ()

-# Linker
-
 string (REGEX MATCHALL "[0-9]+" COMPILER_VERSION_LIST ${CMAKE_CXX_COMPILER_VERSION})
 list (GET COMPILER_VERSION_LIST 0 COMPILER_VERSION_MAJOR)

-# Example values: `lld-10`
+# Linker
 option (LINKER_NAME "Linker name or full path")

 if (LINKER_NAME MATCHES "gold")
@@ -48,19 +40,15 @@ if (LINKER_NAME MATCHES "gold")
 endif ()

 if (NOT LINKER_NAME)
-    if (COMPILER_CLANG)
-        if (OS_LINUX AND NOT ARCH_S390X)
-            find_program (LLD_PATH NAMES "ld.lld-${COMPILER_VERSION_MAJOR}" "ld.lld")
-        elseif (OS_DARWIN)
-            find_program (LLD_PATH NAMES "ld")
-        endif ()
+    if (OS_LINUX AND NOT ARCH_S390X)
+        find_program (LLD_PATH NAMES "ld.lld-${COMPILER_VERSION_MAJOR}" "ld.lld")
+    elseif (OS_DARWIN)
+        find_program (LLD_PATH NAMES "ld")
     endif ()
     if (LLD_PATH)
         if (OS_LINUX OR OS_DARWIN)
-            if (COMPILER_CLANG)
-                # Clang driver simply allows full linker path.
-                set (LINKER_NAME ${LLD_PATH})
-            endif ()
+            # Clang driver simply allows full linker path.
+            set (LINKER_NAME ${LLD_PATH})
         endif ()
     endif()
 endif()
@@ -82,47 +70,28 @@ else ()
 endif ()

 # Archiver
-
-if (COMPILER_CLANG)
-    find_program (LLVM_AR_PATH NAMES "llvm-ar-${COMPILER_VERSION_MAJOR}" "llvm-ar")
-endif ()
-
+find_program (LLVM_AR_PATH NAMES "llvm-ar-${COMPILER_VERSION_MAJOR}" "llvm-ar")
 if (LLVM_AR_PATH)
     set (CMAKE_AR "${LLVM_AR_PATH}")
 endif ()
-
 message(STATUS "Using archiver: ${CMAKE_AR}")

 # Ranlib
-
-if (COMPILER_CLANG)
-    find_program (LLVM_RANLIB_PATH NAMES "llvm-ranlib-${COMPILER_VERSION_MAJOR}" "llvm-ranlib")
-endif ()
-
+find_program (LLVM_RANLIB_PATH NAMES "llvm-ranlib-${COMPILER_VERSION_MAJOR}" "llvm-ranlib")
 if (LLVM_RANLIB_PATH)
     set (CMAKE_RANLIB "${LLVM_RANLIB_PATH}")
 endif ()
-
 message(STATUS "Using ranlib: ${CMAKE_RANLIB}")

 # Install Name Tool
-
-if (COMPILER_CLANG)
-    find_program (LLVM_INSTALL_NAME_TOOL_PATH NAMES "llvm-install-name-tool-${COMPILER_VERSION_MAJOR}" "llvm-install-name-tool")
-endif ()
-
+find_program (LLVM_INSTALL_NAME_TOOL_PATH NAMES "llvm-install-name-tool-${COMPILER_VERSION_MAJOR}" "llvm-install-name-tool")
 if (LLVM_INSTALL_NAME_TOOL_PATH)
     set (CMAKE_INSTALL_NAME_TOOL "${LLVM_INSTALL_NAME_TOOL_PATH}")
 endif ()
-
 message(STATUS "Using install-name-tool: ${CMAKE_INSTALL_NAME_TOOL}")

 # Objcopy
-
-if (COMPILER_CLANG)
-    find_program (OBJCOPY_PATH NAMES "llvm-objcopy-${COMPILER_VERSION_MAJOR}" "llvm-objcopy" "objcopy")
-endif ()
-
+find_program (OBJCOPY_PATH NAMES "llvm-objcopy-${COMPILER_VERSION_MAJOR}" "llvm-objcopy" "objcopy")
 if (OBJCOPY_PATH)
     message (STATUS "Using objcopy: ${OBJCOPY_PATH}")
 else ()
@@ -130,11 +99,7 @@ else ()
 endif ()

 # Strip
-
-if (COMPILER_CLANG)
-    find_program (STRIP_PATH NAMES "llvm-strip-${COMPILER_VERSION_MAJOR}" "llvm-strip" "strip")
-endif ()
-
+find_program (STRIP_PATH NAMES "llvm-strip-${COMPILER_VERSION_MAJOR}" "llvm-strip" "strip")
 if (STRIP_PATH)
     message (STATUS "Using strip: ${STRIP_PATH}")
 else ()
diff --git a/cmake/warnings.cmake b/cmake/warnings.cmake
index 455e4f09939..807d92d9077 100644
--- a/cmake/warnings.cmake
+++ b/cmake/warnings.cmake
@@ -15,37 +15,35 @@ if ((NOT CMAKE_BUILD_TYPE_UC STREQUAL "DEBUG") AND (NOT SANITIZE) AND (NOT CMAKE
     add_warning(frame-larger-than=65536)
 endif ()

-if (COMPILER_CLANG)
-    # Add some warnings that are not available even with -Wall -Wextra -Wpedantic.
-    # We want to get everything out of the compiler for code quality.
-    add_warning(everything)
-    add_warning(pedantic)
-    no_warning(zero-length-array)
-    no_warning(c++98-compat-pedantic)
-    no_warning(c++98-compat)
-    no_warning(c++20-compat) # Use constinit in C++20 without warnings
-    no_warning(sign-conversion)
-    no_warning(implicit-int-conversion)
-    no_warning(implicit-int-float-conversion)
-    no_warning(ctad-maybe-unsupported) # clang 9+, linux-only
-    no_warning(disabled-macro-expansion)
-    no_warning(documentation-unknown-command)
-    no_warning(double-promotion)
-    no_warning(exit-time-destructors)
-    no_warning(float-equal)
-    no_warning(global-constructors)
-    no_warning(missing-prototypes)
-    no_warning(missing-variable-declarations)
-    no_warning(padded)
-    no_warning(switch-enum)
-    no_warning(undefined-func-template)
-    no_warning(unused-template)
-    no_warning(vla)
-    no_warning(weak-template-vtables)
-    no_warning(weak-vtables)
-    no_warning(thread-safety-negative) # experimental flag, too many false positives
-    no_warning(enum-constexpr-conversion) # breaks magic-enum library in clang-16
-    no_warning(unsafe-buffer-usage) # too aggressive
-    no_warning(switch-default) # conflicts with "defaults in a switch covering all enum values"
-    # TODO Enable conversion, sign-conversion, double-promotion warnings.
-endif ()
+# Add some warnings that are not available even with -Wall -Wextra -Wpedantic.
+# We want to get everything out of the compiler for code quality.
+add_warning(everything)
+add_warning(pedantic)
+no_warning(zero-length-array)
+no_warning(c++98-compat-pedantic)
+no_warning(c++98-compat)
+no_warning(c++20-compat) # Use constinit in C++20 without warnings
+no_warning(sign-conversion)
+no_warning(implicit-int-conversion)
+no_warning(implicit-int-float-conversion)
+no_warning(ctad-maybe-unsupported) # clang 9+, linux-only
+no_warning(disabled-macro-expansion)
+no_warning(documentation-unknown-command)
+no_warning(double-promotion)
+no_warning(exit-time-destructors)
+no_warning(float-equal)
+no_warning(global-constructors)
+no_warning(missing-prototypes)
+no_warning(missing-variable-declarations)
+no_warning(padded)
+no_warning(switch-enum)
+no_warning(undefined-func-template)
+no_warning(unused-template)
+no_warning(vla)
+no_warning(weak-template-vtables)
+no_warning(weak-vtables)
+no_warning(thread-safety-negative) # experimental flag, too many false positives
+no_warning(enum-constexpr-conversion) # breaks magic-enum library in clang-16
+no_warning(unsafe-buffer-usage) # too aggressive
+no_warning(switch-default) # conflicts with "defaults in a switch covering all enum values"
+# TODO Enable conversion, sign-conversion, double-promotion warnings.
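The add_warning()/no_warning() helpers used above come from cmake/add_warning.cmake, which CMakeLists.txt includes early on; their definition is not part of this patch. Conceptually they are thin wrappers along these lines (a rough sketch under that assumption, not the project's actual implementation, which may also probe whether the compiler accepts the flag first):

```cmake
# Hypothetical sketch: map a bare warning name onto -W<name> / -Wno-<name>
# and append it to both the C and C++ flags.
macro (add_warning flag)
    set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -W${flag}")
    set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -W${flag}")
endmacro ()

macro (no_warning flag)
    set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-${flag}")
    set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -Wno-${flag}")
endmacro ()
```

Because the build now rejects anything but Clang at configure time (see the cmake/tools.cmake hunk above), these Clang-only warning names no longer need a COMPILER_CLANG guard.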
from Homebrew.") + endif () - # For a mapping between XCode / AppleClang / vanilla Clang versions, see https://en.wikipedia.org/wiki/Xcode - if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${APPLE_CLANG_MINIMUM_VERSION}) - message (FATAL_ERROR "Compilation with AppleClang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${APPLE_CLANG_MINIMUM_VERSION} (Xcode ${XCODE_MINIMUM_VERSION}).") - endif () - else () - if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${CLANG_MINIMUM_VERSION}) - message (FATAL_ERROR "Compilation with Clang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${CLANG_MINIMUM_VERSION}.") - endif () + # For a mapping between XCode / AppleClang / vanilla Clang versions, see https://en.wikipedia.org/wiki/Xcode + if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${APPLE_CLANG_MINIMUM_VERSION}) + message (FATAL_ERROR "Compilation with AppleClang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${APPLE_CLANG_MINIMUM_VERSION} (Xcode ${XCODE_MINIMUM_VERSION}).") + endif () +else () + if (CMAKE_CXX_COMPILER_VERSION VERSION_LESS ${CLANG_MINIMUM_VERSION}) + message (FATAL_ERROR "Compilation with Clang version ${CMAKE_CXX_COMPILER_VERSION} is unsupported, the minimum required version is ${CLANG_MINIMUM_VERSION}.") endif () endif () -# Linker - string (REGEX MATCHALL "[0-9]+" COMPILER_VERSION_LIST ${CMAKE_CXX_COMPILER_VERSION}) list (GET COMPILER_VERSION_LIST 0 COMPILER_VERSION_MAJOR) -# Example values: `lld-10` +# Linker option (LINKER_NAME "Linker name or full path") if (LINKER_NAME MATCHES "gold") @@ -48,19 +40,15 @@ if (LINKER_NAME MATCHES "gold") endif () if (NOT LINKER_NAME) - if (COMPILER_CLANG) - if (OS_LINUX AND NOT ARCH_S390X) - find_program (LLD_PATH NAMES "ld.lld-${COMPILER_VERSION_MAJOR}" "ld.lld") - elseif (OS_DARWIN) - find_program (LLD_PATH NAMES "ld") - endif () + if (OS_LINUX AND NOT ARCH_S390X) + find_program (LLD_PATH NAMES "ld.lld-${COMPILER_VERSION_MAJOR}" "ld.lld") + elseif (OS_DARWIN) + find_program (LLD_PATH NAMES "ld") endif () if (LLD_PATH) if (OS_LINUX OR OS_DARWIN) - if (COMPILER_CLANG) - # Clang driver simply allows full linker path. - set (LINKER_NAME ${LLD_PATH}) - endif () + # Clang driver simply allows full linker path. 
From f45e032715dcc04d3ef78d84750c0f5f835b5008 Mon Sep 17 00:00:00 2001
From: Yohann Jardin
Date: Tue, 7 May 2024 21:11:04 +0200
Subject: [PATCH 135/289] fix errorCodes in stateless tests

---
 tests/queries/0_stateless/00727_concat.sql | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/00727_concat.sql b/tests/queries/0_stateless/00727_concat.sql
index f5048dcaaae..01792545b5a 100644
--- a/tests/queries/0_stateless/00727_concat.sql
+++ b/tests/queries/0_stateless/00727_concat.sql
@@ -93,4 +93,4 @@ SELECT concat(materialize(NULL :: Nullable(UInt64)));

 SELECT CONCAT('Testing the ', 'alias');

-SELECT concat(); -- { serverError 42 }
+SELECT concat(); -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION }
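Stateless tests mark expected failures with a `-- { serverError ... }` annotation, and the harness accepts either the numeric error code or its symbolic name from src/Common/ErrorCodes.cpp; the names are preferred because a bare number like 42 says nothing on its own. A couple of illustrative uses of the pattern (the second error name is an assumption about the usual ClickHouse error-code set, not something this patch touches):

```sql
-- Symbolic error names make the expectation self-describing:
SELECT concat();           -- { serverError TOO_FEW_ARGUMENTS_FOR_FUNCTION }
SELECT throwIf(1, 'boom'); -- { serverError FUNCTION_THROW_IF_VALUE_IS_NON_ZERO }
```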
From 577dccd47ff70af55140b673a436354d289c1344 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Tue, 7 May 2024 21:09:19 +0200
Subject: [PATCH 136/289] Fix ProfileEventTimeIncrement code

Signed-off-by: Azat Khuzhin
---
 src/Common/ElapsedTimeProfileEventIncrement.h | 11 +++++------
 1 file changed, 5 insertions(+), 6 deletions(-)

diff --git a/src/Common/ElapsedTimeProfileEventIncrement.h b/src/Common/ElapsedTimeProfileEventIncrement.h
index 731295a4cfd..aa944beeaa9 100644
--- a/src/Common/ElapsedTimeProfileEventIncrement.h
+++ b/src/Common/ElapsedTimeProfileEventIncrement.h
@@ -17,19 +17,18 @@ enum Time
 template
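The header patched above implements a small RAII helper: construct it at the top of a scope, and on destruction it adds the scope's elapsed wall-clock time to a ProfileEvents counter at the resolution selected by the Time template parameter. A self-contained sketch of that pattern (illustrative only; the scoped enum, member names, and the ProfileEvents stand-ins are assumptions based on the visible header, not the actual ClickHouse code):

```cpp
#include <chrono>
#include <cstddef>
#include <cstdint>

// Stand-ins for ClickHouse's ProfileEvents machinery.
namespace ProfileEvents
{
    using Event = size_t;
    void increment(Event event, uint64_t amount); // defined elsewhere
}

enum class Time { Nanoseconds, Microseconds, Milliseconds, Seconds };

// On destruction, add the time elapsed since construction to `event`,
// scaled to the requested resolution.
template <Time unit = Time::Microseconds>
struct ProfileEventTimeIncrement
{
    using Clock = std::chrono::steady_clock;

    explicit ProfileEventTimeIncrement(ProfileEvents::Event event_)
        : event(event_), start(Clock::now()) {}

    ~ProfileEventTimeIncrement()
    {
        const auto elapsed = Clock::now() - start;
        uint64_t amount = 0;
        switch (unit)
        {
            case Time::Nanoseconds:
                amount = std::chrono::duration_cast<std::chrono::nanoseconds>(elapsed).count();
                break;
            case Time::Microseconds:
                amount = std::chrono::duration_cast<std::chrono::microseconds>(elapsed).count();
                break;
            case Time::Milliseconds:
                amount = std::chrono::duration_cast<std::chrono::milliseconds>(elapsed).count();
                break;
            case Time::Seconds:
                amount = std::chrono::duration_cast<std::chrono::seconds>(elapsed).count();
                break;
        }
        ProfileEvents::increment(event, amount);
    }

    ProfileEvents::Event event;
    Clock::time_point start;
};
```

Typical use would be `ProfileEventTimeIncrement<Time::Microseconds> watch(ProfileEvents::SomeCounter);` at the start of the code being measured, with SomeCounter being a hypothetical event name.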